diff --git "a/trainer_state.json" "b/trainer_state.json" --- "a/trainer_state.json" +++ "b/trainer_state.json" @@ -1,10 +1,10 @@ { - "best_global_step": 4700, - "best_metric": 0.6361829025844931, - "best_model_checkpoint": "./bert-philosophy-classifier/checkpoint-4000", - "epoch": 19.771863117870723, + "best_global_step": 2900, + "best_metric": 0.5787694388100068, + "best_model_checkpoint": "./bert-philosophy-classifier/checkpoint-2000", + "epoch": 11.971830985915492, "eval_steps": 100, - "global_step": 5200, + "global_step": 3400, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, @@ -12,41615 +12,29085 @@ { "epoch": 0, "step": 0, - "train/classification_loss": 0.7054187655448914, - "train/contrastive_loss": 9.865852355957031, - "train/negative_loss": 9.865808486938477, + "train/classification_loss": 0.6910466551780701, + "train/contrastive_loss": 8.255268096923828, + "train/negative_loss": 8.255146026611328, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 4.3711199396057054e-05, - "train/total_loss": 2.678589344024658 + "train/positive_loss": 0.00012198019248899072, + "train/total_loss": 2.3421003818511963 }, { "epoch": 0, "step": 0, - "train/classification_loss": 0.6973287463188171, - "train/contrastive_loss": 9.269636154174805, - "train/negative_loss": 9.269482612609863, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.00015397879178635776, - "train/total_loss": 2.551255941390991 + "train/classification_loss": 0.6955318450927734, + "train/contrastive_loss": 8.37961196899414, + "train/negative_loss": 8.379453659057617, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.00015867262845858932, + "train/total_loss": 2.3714542388916016 }, { - "epoch": 0.19011406844106463, - "grad_norm": 15.935681343078613, + "epoch": 0.176056338028169, + "grad_norm": 16.515756607055664, "learning_rate": 9.4e-06, - "loss": 3.8105, + "loss": 3.5924, "step": 50 }, { - "epoch": 0.19011406844106463, + "epoch": 0.176056338028169, "step": 50, - "train/classification_loss": 0.6410624384880066, - "train/contrastive_loss": 2.2392566204071045, - "train/negative_loss": 1.8866918087005615, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.35256490111351013, - "train/total_loss": 1.0889137983322144 + "train/classification_loss": 0.6504760384559631, + "train/contrastive_loss": 2.0566799640655518, + "train/negative_loss": 2.038007974624634, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.01867193542420864, + "train/total_loss": 1.0618120431900024 }, { - "epoch": 0.19011406844106463, + "epoch": 0.176056338028169, "step": 50, - "train/classification_loss": 0.6499760746955872, - "train/contrastive_loss": 1.537755012512207, - "train/negative_loss": 1.3869619369506836, - "train/num_negatives": 22, - "train/num_positives": 34, - "train/positive_loss": 0.15079309046268463, - "train/total_loss": 0.9575270414352417 + "train/classification_loss": 0.6553352475166321, + "train/contrastive_loss": 2.5260558128356934, + "train/negative_loss": 2.4801580905914307, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 0.04589761793613434, + "train/total_loss": 1.1605464220046997 }, { - "epoch": 0.38022813688212925, - "grad_norm": 22.162322998046875, + "epoch": 0.352112676056338, + "grad_norm": 15.680583953857422, "learning_rate": 1.94e-05, - "loss": 1.9157, + "loss": 1.9545, "step": 100 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5141388773918152, - "train/contrastive_loss": 2.5344395637512207, - "train/negative_loss": 2.2693448066711426, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.2650948464870453, - "train/total_loss": 1.021026849746704 + "train/classification_loss": 0.5292062163352966, + "train/contrastive_loss": 2.306614637374878, + "train/negative_loss": 2.2695488929748535, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.037065789103507996, + "train/total_loss": 0.9905291795730591 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5132154226303101, - "train/contrastive_loss": 2.315289258956909, - "train/negative_loss": 1.9013853073120117, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.4139039218425751, - "train/total_loss": 0.9762732982635498 + "train/classification_loss": 0.5466294288635254, + "train/contrastive_loss": 1.9586219787597656, + "train/negative_loss": 1.9250495433807373, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.033572472631931305, + "train/total_loss": 0.9383538365364075 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.49959126114845276, - "train/contrastive_loss": 2.025355815887451, - "train/negative_loss": 1.4486807584762573, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.5766750574111938, - "train/total_loss": 0.9046624302864075 + "train/classification_loss": 0.5346500873565674, + "train/contrastive_loss": 1.781119704246521, + "train/negative_loss": 1.5406951904296875, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.24042446911334991, + "train/total_loss": 0.8908740282058716 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5000876188278198, - "train/contrastive_loss": 2.4203708171844482, - "train/negative_loss": 2.1490285396575928, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.27134227752685547, - "train/total_loss": 0.9841617941856384 + "train/classification_loss": 0.5251791477203369, + "train/contrastive_loss": 3.1425154209136963, + "train/negative_loss": 2.693556785583496, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.4489586651325226, + "train/total_loss": 1.1536822319030762 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5278957486152649, - "train/contrastive_loss": 1.8679933547973633, - "train/negative_loss": 1.3538023233413696, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.5141909718513489, - "train/total_loss": 0.9014943838119507 + "train/classification_loss": 0.5305714011192322, + "train/contrastive_loss": 3.5068647861480713, + "train/negative_loss": 3.474233388900757, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.03263139724731445, + "train/total_loss": 1.2319443225860596 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5064294934272766, - "train/contrastive_loss": 1.893783450126648, - "train/negative_loss": 1.6102145910263062, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.2835688889026642, - "train/total_loss": 0.8851861953735352 + "train/classification_loss": 0.5261136889457703, + "train/contrastive_loss": 2.0268311500549316, + "train/negative_loss": 1.752275824546814, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.2745553255081177, + "train/total_loss": 0.9314799308776855 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5230724215507507, - "train/contrastive_loss": 3.0714101791381836, - "train/negative_loss": 2.6625325679779053, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.4088776707649231, - "train/total_loss": 1.1373544931411743 + "train/classification_loss": 0.5449552536010742, + "train/contrastive_loss": 1.596300721168518, + "train/negative_loss": 1.2735298871994019, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.3227708041667938, + "train/total_loss": 0.8642153739929199 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5051161646842957, - "train/contrastive_loss": 2.2798073291778564, - "train/negative_loss": 1.6065303087234497, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.673276960849762, - "train/total_loss": 0.9610776305198669 + "train/classification_loss": 0.5408021211624146, + "train/contrastive_loss": 1.4297927618026733, + "train/negative_loss": 1.4292274713516235, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 0.0005652713589370251, + "train/total_loss": 0.8267606496810913 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.4931166470050812, - "train/contrastive_loss": 1.994917869567871, - "train/negative_loss": 1.9571514129638672, + "train/classification_loss": 0.546276867389679, + "train/contrastive_loss": 1.0722688436508179, + "train/negative_loss": 1.0496809482574463, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.03776644542813301, - "train/total_loss": 0.8921002149581909 + "train/positive_loss": 0.022587856277823448, + "train/total_loss": 0.7607306241989136 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.518193781375885, - "train/contrastive_loss": 3.3919193744659424, - "train/negative_loss": 2.9458096027374268, + "train/classification_loss": 0.5323413610458374, + "train/contrastive_loss": 2.9199142456054688, + "train/negative_loss": 1.6162124872207642, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.4461098313331604, - "train/total_loss": 1.1965776681900024 + "train/num_positives": 14, + "train/positive_loss": 1.3037017583847046, + "train/total_loss": 1.1163241863250732 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5106610655784607, - "train/contrastive_loss": 1.5425939559936523, - "train/negative_loss": 1.2229632139205933, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.3196307122707367, - "train/total_loss": 0.819179892539978 + "train/classification_loss": 0.5450893044471741, + "train/contrastive_loss": 2.1610963344573975, + "train/negative_loss": 2.000896453857422, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.1601998507976532, + "train/total_loss": 0.9773085713386536 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.501491129398346, - "train/contrastive_loss": 2.483175039291382, - "train/negative_loss": 1.9951627254486084, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.4880124032497406, - "train/total_loss": 0.9981261491775513 + "train/classification_loss": 0.5373836755752563, + "train/contrastive_loss": 1.8006857633590698, + "train/negative_loss": 1.7946306467056274, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.006055121775716543, + "train/total_loss": 0.8975208401679993 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5075777173042297, - "train/contrastive_loss": 3.8742496967315674, - "train/negative_loss": 3.786134719848633, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.08811492472887039, - "train/total_loss": 1.2824276685714722 + "train/classification_loss": 0.523068904876709, + "train/contrastive_loss": 3.6596007347106934, + "train/negative_loss": 3.1865477561950684, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.47305306792259216, + "train/total_loss": 1.2549891471862793 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5088307857513428, - "train/contrastive_loss": 1.9482722282409668, - "train/negative_loss": 1.4511663913726807, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.49710583686828613, - "train/total_loss": 0.8984852433204651 + "train/classification_loss": 0.5393645167350769, + "train/contrastive_loss": 2.5353968143463135, + "train/negative_loss": 2.22615909576416, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.30923765897750854, + "train/total_loss": 1.0464439392089844 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.49460119009017944, - "train/contrastive_loss": 2.484555721282959, - "train/negative_loss": 2.004930019378662, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.4796257019042969, - "train/total_loss": 0.9915122985839844 + "train/classification_loss": 0.5152075290679932, + "train/contrastive_loss": 3.255272626876831, + "train/negative_loss": 2.8025577068328857, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.4527149796485901, + "train/total_loss": 1.166262149810791 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5063183903694153, - "train/contrastive_loss": 1.7020066976547241, - "train/negative_loss": 1.4744956493377686, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.22751109302043915, - "train/total_loss": 0.8467197418212891 + "train/classification_loss": 0.532563328742981, + "train/contrastive_loss": 2.4751503467559814, + "train/negative_loss": 1.9839431047439575, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.49120721220970154, + "train/total_loss": 1.0275933742523193 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5180426836013794, - "train/contrastive_loss": 2.3781521320343018, - "train/negative_loss": 2.124603748321533, - "train/num_negatives": 40, + "train/classification_loss": 0.5331189036369324, + "train/contrastive_loss": 2.0612425804138184, + "train/negative_loss": 1.8743646144866943, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.25354844331741333, - "train/total_loss": 0.9936730861663818 + "train/positive_loss": 0.1868780106306076, + "train/total_loss": 0.9453674554824829 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5121698379516602, - "train/contrastive_loss": 2.293426036834717, - "train/negative_loss": 1.8747484683990479, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.4186776280403137, - "train/total_loss": 0.9708550572395325 + "train/classification_loss": 0.5387558937072754, + "train/contrastive_loss": 3.6453282833099365, + "train/negative_loss": 3.446204662322998, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.19912365078926086, + "train/total_loss": 1.2678215503692627 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5130935311317444, - "train/contrastive_loss": 2.1441965103149414, - "train/negative_loss": 1.9577550888061523, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.1864413619041443, - "train/total_loss": 0.9419327974319458 + "train/classification_loss": 0.5483106374740601, + "train/contrastive_loss": 1.8980530500411987, + "train/negative_loss": 1.8654059171676636, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.032647132873535156, + "train/total_loss": 0.9279212951660156 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5037055611610413, - "train/contrastive_loss": 2.3802385330200195, - "train/negative_loss": 2.0378806591033936, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.34235790371894836, - "train/total_loss": 0.9797532558441162 + "train/classification_loss": 0.5107576251029968, + "train/contrastive_loss": 3.270677328109741, + "train/negative_loss": 3.239260673522949, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.03141666576266289, + "train/total_loss": 1.1648931503295898 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.519368052482605, - "train/contrastive_loss": 3.63668155670166, - "train/negative_loss": 2.4528391361236572, - "train/num_negatives": 44, + "train/classification_loss": 0.5458145141601562, + "train/contrastive_loss": 1.5782126188278198, + "train/negative_loss": 1.5090008974075317, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.1838423013687134, - "train/total_loss": 1.246704339981079 + "train/positive_loss": 0.0692116767168045, + "train/total_loss": 0.8614570498466492 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5339018106460571, - "train/contrastive_loss": 2.3565452098846436, - "train/negative_loss": 2.3150925636291504, - "train/num_negatives": 44, + "train/classification_loss": 0.5230406522750854, + "train/contrastive_loss": 2.8396332263946533, + "train/negative_loss": 2.7991995811462402, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.04145267978310585, - "train/total_loss": 1.0052108764648438 + "train/positive_loss": 0.04043358564376831, + "train/total_loss": 1.0909672975540161 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5002714991569519, - "train/contrastive_loss": 2.302501916885376, - "train/negative_loss": 1.557116150856018, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.7453858256340027, - "train/total_loss": 0.960771918296814 + "train/classification_loss": 0.5388726592063904, + "train/contrastive_loss": 2.4029741287231445, + "train/negative_loss": 2.341367721557617, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.06160643696784973, + "train/total_loss": 1.0194674730300903 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.49764755368232727, - "train/contrastive_loss": 1.544675350189209, - "train/negative_loss": 1.3218947649002075, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.22278054058551788, - "train/total_loss": 0.8065826296806335 + "train/classification_loss": 0.5483464598655701, + "train/contrastive_loss": 2.159550905227661, + "train/negative_loss": 1.6986929178237915, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.46085792779922485, + "train/total_loss": 0.9802566766738892 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.4848215878009796, - "train/contrastive_loss": 1.93720543384552, - "train/negative_loss": 1.576495885848999, + "train/classification_loss": 0.5432572960853577, + "train/contrastive_loss": 1.7347164154052734, + "train/negative_loss": 1.6608059406280518, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.360709547996521, - "train/total_loss": 0.872262716293335 + "train/num_positives": 10, + "train/positive_loss": 0.0739104300737381, + "train/total_loss": 0.8902006149291992 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5225034356117249, - "train/contrastive_loss": 1.8692991733551025, - "train/negative_loss": 0.7269907593727112, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.1423084735870361, - "train/total_loss": 0.8963632583618164 + "train/classification_loss": 0.5226185917854309, + "train/contrastive_loss": 2.3534626960754395, + "train/negative_loss": 2.00205659866333, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.35140615701675415, + "train/total_loss": 0.9933111667633057 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5088687539100647, - "train/contrastive_loss": 2.0347771644592285, - "train/negative_loss": 1.938789963722229, + "train/classification_loss": 0.5365185737609863, + "train/contrastive_loss": 4.000570297241211, + "train/negative_loss": 2.8349084854125977, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.09598712623119354, - "train/total_loss": 0.9158241748809814 + "train/num_positives": 4, + "train/positive_loss": 1.1656616926193237, + "train/total_loss": 1.3366327285766602 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5115606188774109, - "train/contrastive_loss": 3.5256614685058594, - "train/negative_loss": 2.547478675842285, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.9781829118728638, - "train/total_loss": 1.2166929244995117 + "train/classification_loss": 0.5436530709266663, + "train/contrastive_loss": 2.752227306365967, + "train/negative_loss": 2.3868792057037354, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.36534813046455383, + "train/total_loss": 1.0940985679626465 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5083501935005188, - "train/contrastive_loss": 2.0617685317993164, - "train/negative_loss": 1.7738186120986938, - "train/num_negatives": 40, + "train/classification_loss": 0.5252662301063538, + "train/contrastive_loss": 3.149979591369629, + "train/negative_loss": 2.1100027561187744, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.28794994950294495, - "train/total_loss": 0.9207038879394531 + "train/positive_loss": 1.0399768352508545, + "train/total_loss": 1.1552622318267822 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5134417414665222, - "train/contrastive_loss": 2.7064294815063477, - "train/negative_loss": 2.2278876304626465, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.478541761636734, - "train/total_loss": 1.0547276735305786 + "train/classification_loss": 0.53873211145401, + "train/contrastive_loss": 2.7749056816101074, + "train/negative_loss": 2.756542205810547, + "train/num_negatives": 38, + "train/num_positives": 10, + "train/positive_loss": 0.01836339570581913, + "train/total_loss": 1.0937132835388184 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5130801796913147, - "train/contrastive_loss": 2.2027816772460938, - "train/negative_loss": 1.353335976600647, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.8494455814361572, - "train/total_loss": 0.9536365270614624 + "train/classification_loss": 0.5252187848091125, + "train/contrastive_loss": 1.385758876800537, + "train/negative_loss": 1.364824652671814, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.020934201776981354, + "train/total_loss": 0.802370548248291 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5094675421714783, - "train/contrastive_loss": 2.494227647781372, - "train/negative_loss": 2.1596906185150146, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.33453696966171265, - "train/total_loss": 1.0083130598068237 + "train/classification_loss": 0.5307956337928772, + "train/contrastive_loss": 2.145063638687134, + "train/negative_loss": 1.7865453958511353, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.3585182726383209, + "train/total_loss": 0.959808349609375 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5282798409461975, - "train/contrastive_loss": 2.160306692123413, - "train/negative_loss": 2.1407148838043213, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.019591866061091423, - "train/total_loss": 0.960341215133667 + "train/classification_loss": 0.5319681763648987, + "train/contrastive_loss": 2.523132085800171, + "train/negative_loss": 2.286376714706421, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.2367553412914276, + "train/total_loss": 1.0365946292877197 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5149160027503967, - "train/contrastive_loss": 2.3513805866241455, - "train/negative_loss": 2.0907909870147705, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.2605895400047302, - "train/total_loss": 0.9851921200752258 + "train/classification_loss": 0.5492977499961853, + "train/contrastive_loss": 2.4941790103912354, + "train/negative_loss": 1.497723937034607, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.9964550733566284, + "train/total_loss": 1.0481336116790771 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5017629861831665, - "train/contrastive_loss": 2.2446932792663574, - "train/negative_loss": 1.3195736408233643, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.9251196384429932, - "train/total_loss": 0.9507016539573669 + "train/classification_loss": 0.5363556146621704, + "train/contrastive_loss": 1.8118360042572021, + "train/negative_loss": 1.7267634868621826, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.08507253974676132, + "train/total_loss": 0.8987228274345398 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.4931255877017975, - "train/contrastive_loss": 5.117409706115723, - "train/negative_loss": 2.9382598400115967, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 2.179149627685547, - "train/total_loss": 1.5166075229644775 + "train/classification_loss": 0.5309258699417114, + "train/contrastive_loss": 2.3783364295959473, + "train/negative_loss": 2.352630376815796, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.025705955922603607, + "train/total_loss": 1.0065932273864746 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5013383030891418, - "train/contrastive_loss": 2.5799336433410645, - "train/negative_loss": 2.2291648387908936, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.3507687747478485, - "train/total_loss": 1.0173250436782837 + "train/classification_loss": 0.5422551035881042, + "train/contrastive_loss": 1.544332504272461, + "train/negative_loss": 1.3956546783447266, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 0.14867788553237915, + "train/total_loss": 0.8511216044425964 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5124106407165527, - "train/contrastive_loss": 2.7270424365997314, - "train/negative_loss": 2.076951503753662, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.6500909924507141, - "train/total_loss": 1.057819128036499 + "train/classification_loss": 0.5545170903205872, + "train/contrastive_loss": 2.345576047897339, + "train/negative_loss": 2.2640533447265625, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.0815226212143898, + "train/total_loss": 1.023632287979126 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5080915689468384, - "train/contrastive_loss": 1.804985523223877, - "train/negative_loss": 1.737541913986206, - "train/num_negatives": 46, + "train/classification_loss": 0.5410986542701721, + "train/contrastive_loss": 2.3546016216278076, + "train/negative_loss": 2.3232460021972656, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.031355615705251694, + "train/total_loss": 1.0120189189910889 + }, + { + "epoch": 0.352112676056338, + "step": 100, + "train/classification_loss": 0.5399579405784607, + "train/contrastive_loss": 1.6408647298812866, + "train/negative_loss": 1.4657557010650635, + "train/num_negatives": 42, "train/num_positives": 8, - "train/positive_loss": 0.06744355708360672, - "train/total_loss": 0.8690886497497559 + "train/positive_loss": 0.17510902881622314, + "train/total_loss": 0.8681309223175049 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.501038670539856, - "train/contrastive_loss": 2.1530323028564453, - "train/negative_loss": 2.1294708251953125, + "train/classification_loss": 0.5184195637702942, + "train/contrastive_loss": 1.8366289138793945, + "train/negative_loss": 1.2438676357269287, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.02356150932610035, - "train/total_loss": 0.9316451549530029 + "train/num_positives": 10, + "train/positive_loss": 0.592761218547821, + "train/total_loss": 0.8857453465461731 + }, + { + "epoch": 0.352112676056338, + "step": 100, + "train/classification_loss": 0.5257993936538696, + "train/contrastive_loss": 3.42195987701416, + "train/negative_loss": 2.86478328704834, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.5571765303611755, + "train/total_loss": 1.2101913690567017 + }, + { + "epoch": 0.352112676056338, + "step": 100, + "train/classification_loss": 0.544603705406189, + "train/contrastive_loss": 2.036705493927002, + "train/negative_loss": 1.905866026878357, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.13083946704864502, + "train/total_loss": 0.9519448280334473 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5054866671562195, - "train/contrastive_loss": 1.8644776344299316, - "train/negative_loss": 1.8193776607513428, + "train/classification_loss": 0.5267763733863831, + "train/contrastive_loss": 1.8731989860534668, + "train/negative_loss": 1.8441189527511597, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.04509993642568588, - "train/total_loss": 0.8783822059631348 + "train/positive_loss": 0.029080014675855637, + "train/total_loss": 0.9014161825180054 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5042749047279358, - "train/contrastive_loss": 1.1298089027404785, - "train/negative_loss": 1.072906255722046, - "train/num_negatives": 36, + "train/classification_loss": 0.5378268957138062, + "train/contrastive_loss": 2.221756935119629, + "train/negative_loss": 1.9916719198226929, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.23008498549461365, + "train/total_loss": 0.9821783304214478 + }, + { + "epoch": 0.352112676056338, + "step": 100, + "train/classification_loss": 0.5418212413787842, + "train/contrastive_loss": 4.279918193817139, + "train/negative_loss": 3.504610300064087, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.05690264701843262, - "train/total_loss": 0.7302367091178894 + "train/positive_loss": 0.7753080129623413, + "train/total_loss": 1.3978049755096436 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.510039210319519, - "train/contrastive_loss": 2.489720344543457, - "train/negative_loss": 2.273312568664551, + "train/classification_loss": 0.5320029854774475, + "train/contrastive_loss": 2.450683832168579, + "train/negative_loss": 1.5620760917663574, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.8886077404022217, + "train/total_loss": 1.0221397876739502 + }, + { + "epoch": 0.352112676056338, + "step": 100, + "train/classification_loss": 0.5374838709831238, + "train/contrastive_loss": 2.0769155025482178, + "train/negative_loss": 1.8300950527191162, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.2164078950881958, - "train/total_loss": 1.0079833269119263 + "train/num_positives": 14, + "train/positive_loss": 0.24682042002677917, + "train/total_loss": 0.9528669714927673 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5038439631462097, - "train/contrastive_loss": 3.1949870586395264, - "train/negative_loss": 2.4569616317749023, + "train/classification_loss": 0.5383163094520569, + "train/contrastive_loss": 3.6867856979370117, + "train/negative_loss": 3.633483409881592, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.7380254864692688, - "train/total_loss": 1.1428413391113281 + "train/num_positives": 2, + "train/positive_loss": 0.05330224335193634, + "train/total_loss": 1.2756733894348145 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.49796491861343384, - "train/contrastive_loss": 2.2809040546417236, - "train/negative_loss": 1.6373882293701172, + "train/classification_loss": 0.5388382077217102, + "train/contrastive_loss": 2.449093818664551, + "train/negative_loss": 1.6639244556427002, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.6435158848762512, - "train/total_loss": 0.9541457295417786 + "train/num_positives": 16, + "train/positive_loss": 0.785169243812561, + "train/total_loss": 1.0286569595336914 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.520788848400116, - "train/contrastive_loss": 2.4642531871795654, - "train/negative_loss": 2.329331159591675, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.13492195308208466, - "train/total_loss": 1.0136394500732422 + "train/classification_loss": 0.5398443937301636, + "train/contrastive_loss": 3.40635085105896, + "train/negative_loss": 3.386542320251465, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.019808607175946236, + "train/total_loss": 1.2211146354675293 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.49743562936782837, - "train/contrastive_loss": 1.3867875337600708, - "train/negative_loss": 1.3793987035751343, - "train/num_negatives": 48, + "train/classification_loss": 0.541286826133728, + "train/contrastive_loss": 2.3181488513946533, + "train/negative_loss": 1.805355429649353, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 0.007388879079371691, - "train/total_loss": 0.7747931480407715 + "train/positive_loss": 0.5127934217453003, + "train/total_loss": 1.0049166679382324 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5120257139205933, - "train/contrastive_loss": 1.8927552700042725, - "train/negative_loss": 1.3099662065505981, + "train/classification_loss": 0.5403976440429688, + "train/contrastive_loss": 1.7116339206695557, + "train/negative_loss": 1.5584475994110107, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.5827890634536743, - "train/total_loss": 0.8905767798423767 + "train/num_positives": 14, + "train/positive_loss": 0.15318630635738373, + "train/total_loss": 0.882724404335022 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.48868438601493835, - "train/contrastive_loss": 2.6628432273864746, - "train/negative_loss": 2.610722541809082, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.052120763808488846, - "train/total_loss": 1.021252989768982 + "train/classification_loss": 0.5545975565910339, + "train/contrastive_loss": 2.685664176940918, + "train/negative_loss": 2.6671087741851807, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 0.01855549030005932, + "train/total_loss": 1.0917303562164307 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5226226449012756, - "train/contrastive_loss": 1.1362452507019043, - "train/negative_loss": 0.9865681529045105, - "train/num_negatives": 28, + "train/classification_loss": 0.5304739475250244, + "train/contrastive_loss": 1.4997867345809937, + "train/negative_loss": 1.4348959922790527, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.1496771275997162, - "train/total_loss": 0.7498717308044434 + "train/positive_loss": 0.06489069759845734, + "train/total_loss": 0.830431342124939 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.51773601770401, - "train/contrastive_loss": 2.259053945541382, - "train/negative_loss": 1.8771291971206665, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.3819248378276825, - "train/total_loss": 0.9695467948913574 + "train/classification_loss": 0.528757631778717, + "train/contrastive_loss": 3.1133694648742676, + "train/negative_loss": 3.069612503051758, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.04375695809721947, + "train/total_loss": 1.1514315605163574 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5040704011917114, - "train/contrastive_loss": 2.4974024295806885, - "train/negative_loss": 2.309147357940674, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.18825499713420868, - "train/total_loss": 1.0035508871078491 + "train/classification_loss": 0.5330578684806824, + "train/contrastive_loss": 1.3456382751464844, + "train/negative_loss": 1.287862777709961, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.05777547508478165, + "train/total_loss": 0.8021855354309082 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5042409896850586, - "train/contrastive_loss": 2.986949920654297, - "train/negative_loss": 2.140775203704834, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.8461747765541077, - "train/total_loss": 1.1016309261322021 + "train/classification_loss": 0.5354094505310059, + "train/contrastive_loss": 2.4783427715301514, + "train/negative_loss": 1.6376371383666992, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.8407056331634521, + "train/total_loss": 1.0310779809951782 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.4931391477584839, - "train/contrastive_loss": 3.492546319961548, - "train/negative_loss": 2.964676856994629, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.527869462966919, - "train/total_loss": 1.1916484832763672 + "train/classification_loss": 0.5385649800300598, + "train/contrastive_loss": 2.7976906299591064, + "train/negative_loss": 2.7675998210906982, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.03009072318673134, + "train/total_loss": 1.0981030464172363 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5086107850074768, - "train/contrastive_loss": 2.8950085639953613, - "train/negative_loss": 2.480247974395752, + "train/classification_loss": 0.5312110781669617, + "train/contrastive_loss": 1.37204909324646, + "train/negative_loss": 1.1857126951217651, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.4147605895996094, - "train/total_loss": 1.087612509727478 + "train/num_positives": 16, + "train/positive_loss": 0.18633633852005005, + "train/total_loss": 0.8056209087371826 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.49491333961486816, - "train/contrastive_loss": 2.4414398670196533, - "train/negative_loss": 2.3802330493927, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.06120682880282402, - "train/total_loss": 0.9832013249397278 + "train/classification_loss": 0.5352913737297058, + "train/contrastive_loss": 2.8081698417663574, + "train/negative_loss": 2.6742031574249268, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 0.1339666098356247, + "train/total_loss": 1.0969253778457642 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5205986499786377, - "train/contrastive_loss": 2.997138023376465, - "train/negative_loss": 2.3235912322998047, + "train/classification_loss": 0.5294104218482971, + "train/contrastive_loss": 2.1925151348114014, + "train/negative_loss": 2.1897799968719482, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.6735467910766602, - "train/total_loss": 1.1200263500213623 + "train/num_positives": 2, + "train/positive_loss": 0.0027350601740181446, + "train/total_loss": 0.9679134488105774 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.500521719455719, - "train/contrastive_loss": 3.530078172683716, - "train/negative_loss": 3.499314308166504, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.03076385334134102, - "train/total_loss": 1.2065373659133911 + "train/classification_loss": 0.5238025784492493, + "train/contrastive_loss": 2.6010711193084717, + "train/negative_loss": 2.353334426879883, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.24773679673671722, + "train/total_loss": 1.0440168380737305 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5036959052085876, - "train/contrastive_loss": 2.7629165649414062, - "train/negative_loss": 1.9071204662322998, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.855796217918396, - "train/total_loss": 1.056279182434082 + "train/classification_loss": 0.5400266051292419, + "train/contrastive_loss": 2.8627476692199707, + "train/negative_loss": 2.7112135887145996, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.1515340507030487, + "train/total_loss": 1.1125761270523071 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5036133527755737, - "train/contrastive_loss": 2.094717025756836, - "train/negative_loss": 1.9970005750656128, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.09771650284528732, - "train/total_loss": 0.9225567579269409 + "train/classification_loss": 0.5383491516113281, + "train/contrastive_loss": 4.268233299255371, + "train/negative_loss": 2.231462001800537, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 2.036771059036255, + "train/total_loss": 1.391995906829834 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5122824907302856, - "train/contrastive_loss": 3.5814385414123535, - "train/negative_loss": 2.7314953804016113, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.8499432802200317, - "train/total_loss": 1.2285702228546143 + "train/classification_loss": 0.532766580581665, + "train/contrastive_loss": 2.8463375568389893, + "train/negative_loss": 2.8405442237854004, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.005793261807411909, + "train/total_loss": 1.102034091949463 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5041477680206299, - "train/contrastive_loss": 2.6143274307250977, - "train/negative_loss": 2.0390777587890625, + "train/classification_loss": 0.5443864464759827, + "train/contrastive_loss": 1.849961757659912, + "train/negative_loss": 1.6025692224502563, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.5752497911453247, - "train/total_loss": 1.0270133018493652 + "train/positive_loss": 0.24739256501197815, + "train/total_loss": 0.9143787622451782 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5159657001495361, - "train/contrastive_loss": 1.7917431592941284, - "train/negative_loss": 1.3273086547851562, + "train/classification_loss": 0.529344916343689, + "train/contrastive_loss": 1.9414914846420288, + "train/negative_loss": 1.808849573135376, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.46443453431129456, - "train/total_loss": 0.8743143081665039 + "train/num_positives": 8, + "train/positive_loss": 0.1326419562101364, + "train/total_loss": 0.9176431894302368 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.49786287546157837, - "train/contrastive_loss": 4.343784809112549, - "train/negative_loss": 3.259251356124878, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 1.0845333337783813, - "train/total_loss": 1.3666198253631592 + "train/classification_loss": 0.5177937150001526, + "train/contrastive_loss": 2.0468740463256836, + "train/negative_loss": 2.005218982696533, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.041655153036117554, + "train/total_loss": 0.9271684885025024 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5126004219055176, - "train/contrastive_loss": 2.384019374847412, - "train/negative_loss": 1.6423149108886719, - "train/num_negatives": 46, + "train/classification_loss": 0.5452139377593994, + "train/contrastive_loss": 1.8783801794052124, + "train/negative_loss": 1.5115289688110352, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.7417045831680298, - "train/total_loss": 0.9894043207168579 + "train/positive_loss": 0.36685118079185486, + "train/total_loss": 0.9208899736404419 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.525465726852417, - "train/contrastive_loss": 1.78139328956604, - "train/negative_loss": 1.78139328956604, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.881744384765625 - }, - { - "epoch": 0.38022813688212925, - "eval_exact_match_accuracy": 0.0, - "eval_hamming_loss": 0.09792717086834733, - "eval_loss": 0.9991987347602844, - "eval_macro_f1": 0.004812834224598931, - "eval_macro_precision": 0.04072398190045249, - "eval_macro_recall": 0.002557544757033248, - "eval_micro_f1": 0.020179372197309416, - "eval_micro_precision": 0.6923076923076923, - "eval_micro_recall": 0.010238907849829351, - "eval_runtime": 2.568, - "eval_samples_per_second": 204.438, - "eval_steps_per_second": 25.701, + "train/classification_loss": 0.5393397212028503, + "train/contrastive_loss": 3.0772385597229004, + "train/negative_loss": 2.4198713302612305, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.6573673486709595, + "train/total_loss": 1.1547874212265015 + }, + { + "epoch": 0.352112676056338, + "eval_exact_match_accuracy": 0.007054673721340388, + "eval_hamming_loss": 0.0991804129059031, + "eval_loss": 1.0206341743469238, + "eval_macro_f1": 0.004705882352941177, + "eval_macro_precision": 0.017077798861480076, + "eval_macro_recall": 0.00272892662219527, + "eval_micro_f1": 0.018480492813141684, + "eval_micro_precision": 0.25, + "eval_micro_recall": 0.009594882729211088, + "eval_runtime": 2.8027, + "eval_samples_per_second": 202.303, + "eval_steps_per_second": 25.332, "step": 100 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5153835415840149, - "train/contrastive_loss": 1.9819175004959106, - "train/negative_loss": 1.3787039518356323, - "train/num_negatives": 36, - "train/num_positives": 20, - "train/positive_loss": 0.6032135486602783, - "train/total_loss": 0.9117670059204102 + "train/classification_loss": 0.5403586030006409, + "train/contrastive_loss": 2.3812899589538574, + "train/negative_loss": 1.652747631072998, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.7285423278808594, + "train/total_loss": 1.0166165828704834 }, { - "epoch": 0.38022813688212925, + "epoch": 0.352112676056338, "step": 100, - "train/classification_loss": 0.5005282759666443, - "train/contrastive_loss": 1.6629000902175903, - "train/negative_loss": 1.1018431186676025, + "train/classification_loss": 0.5478186011314392, + "train/contrastive_loss": 1.4490203857421875, + "train/negative_loss": 1.1485689878463745, "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.5610569715499878, - "train/total_loss": 0.8331083059310913 + "train/positive_loss": 0.3004514276981354, + "train/total_loss": 0.8376226425170898 }, { - "epoch": 0.5703422053231939, - "grad_norm": 20.521570205688477, - "learning_rate": 1.9992846270928464e-05, - "loss": 1.6098, + "epoch": 0.528169014084507, + "grad_norm": 18.845754623413086, + "learning_rate": 1.9993375616631433e-05, + "loss": 1.6374, "step": 150 }, { - "epoch": 0.5703422053231939, + "epoch": 0.528169014084507, "step": 150, - "train/classification_loss": 0.43018609285354614, - "train/contrastive_loss": 2.8645718097686768, - "train/negative_loss": 1.2329291105270386, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 1.6316426992416382, - "train/total_loss": 1.0031003952026367 + "train/classification_loss": 0.4399445652961731, + "train/contrastive_loss": 1.8953174352645874, + "train/negative_loss": 1.2232775688171387, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 0.6720398664474487, + "train/total_loss": 0.8190080523490906 }, { - "epoch": 0.5703422053231939, + "epoch": 0.528169014084507, "step": 150, - "train/classification_loss": 0.40478652715682983, - "train/contrastive_loss": 1.354927897453308, - "train/negative_loss": 1.354927897453308, - "train/num_negatives": 56, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.6757720708847046 - }, - { - "epoch": 0.7604562737642585, - "grad_norm": 17.849178314208984, - "learning_rate": 1.9985235920852362e-05, - "loss": 1.433, - "step": 200 + "train/classification_loss": 0.45203354954719543, + "train/contrastive_loss": 2.333707332611084, + "train/negative_loss": 1.3233333826065063, + "train/num_negatives": 28, + "train/num_positives": 20, + "train/positive_loss": 1.0103740692138672, + "train/total_loss": 0.9187750220298767 }, { - "epoch": 0.7604562737642585, - "step": 200, - "train/classification_loss": 0.374879390001297, - "train/contrastive_loss": 2.2762207984924316, - "train/negative_loss": 2.0127594470977783, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.26346147060394287, - "train/total_loss": 0.8301235437393188 + "epoch": 0.704225352112676, + "grad_norm": 22.89767837524414, + "learning_rate": 1.998632840028189e-05, + "loss": 1.4947, + "step": 200 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.35680091381073, - "train/contrastive_loss": 3.0456128120422363, - "train/negative_loss": 2.292947292327881, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.7526654005050659, - "train/total_loss": 0.9659234881401062 + "train/classification_loss": 0.35212618112564087, + "train/contrastive_loss": 2.679692268371582, + "train/negative_loss": 2.5468082427978516, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.13288407027721405, + "train/total_loss": 0.8880646228790283 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3388345539569855, - "train/contrastive_loss": 2.2656548023223877, - "train/negative_loss": 1.487280011177063, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.7783747911453247, - "train/total_loss": 0.7919654846191406 + "train/classification_loss": 0.40419623255729675, + "train/contrastive_loss": 2.1445202827453613, + "train/negative_loss": 2.1230874061584473, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.02143275737762451, + "train/total_loss": 0.8331003189086914 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3411712050437927, - "train/contrastive_loss": 3.0956921577453613, - "train/negative_loss": 2.981250524520874, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.1144416332244873, - "train/total_loss": 0.960309624671936 + "train/classification_loss": 0.36665281653404236, + "train/contrastive_loss": 3.2175021171569824, + "train/negative_loss": 2.35038685798645, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.8671151995658875, + "train/total_loss": 1.0101532936096191 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.37614530324935913, - "train/contrastive_loss": 1.7843455076217651, - "train/negative_loss": 1.6559194326400757, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.12842604517936707, - "train/total_loss": 0.7330144047737122 + "train/classification_loss": 0.3220570683479309, + "train/contrastive_loss": 3.860135793685913, + "train/negative_loss": 3.6707465648651123, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.18938927352428436, + "train/total_loss": 1.0940842628479004 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.35679319500923157, - "train/contrastive_loss": 2.086686849594116, - "train/negative_loss": 1.913096308708191, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.17359061539173126, - "train/total_loss": 0.7741305828094482 + "train/classification_loss": 0.34903034567832947, + "train/contrastive_loss": 4.295506000518799, + "train/negative_loss": 4.278042316436768, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.01746382936835289, + "train/total_loss": 1.2081315517425537 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.383198082447052, - "train/contrastive_loss": 3.2749814987182617, - "train/negative_loss": 2.9826483726501465, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.2923332154750824, - "train/total_loss": 1.0381944179534912 + "train/classification_loss": 0.3510552644729614, + "train/contrastive_loss": 2.4234988689422607, + "train/negative_loss": 2.118229389190674, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.3052694797515869, + "train/total_loss": 0.8357550501823425 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3243286907672882, - "train/contrastive_loss": 1.8737231492996216, - "train/negative_loss": 1.4502716064453125, - "train/num_negatives": 42, + "train/classification_loss": 0.3522025942802429, + "train/contrastive_loss": 2.070845603942871, + "train/negative_loss": 1.6335164308547974, + "train/num_negatives": 36, "train/num_positives": 14, - "train/positive_loss": 0.4234515130519867, - "train/total_loss": 0.699073314666748 + "train/positive_loss": 0.4373290538787842, + "train/total_loss": 0.7663717269897461 + }, + { + "epoch": 0.704225352112676, + "step": 200, + "train/classification_loss": 0.3764512538909912, + "train/contrastive_loss": 1.995721697807312, + "train/negative_loss": 1.995355486869812, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 0.0003661587543319911, + "train/total_loss": 0.7755956053733826 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3341130018234253, - "train/contrastive_loss": 2.057563543319702, - "train/negative_loss": 2.013054370880127, + "train/classification_loss": 0.3572298586368561, + "train/contrastive_loss": 1.0032556056976318, + "train/negative_loss": 0.9694838523864746, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.04450918361544609, - "train/total_loss": 0.7456257343292236 + "train/positive_loss": 0.033771805465221405, + "train/total_loss": 0.5578809976577759 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.38041070103645325, - "train/contrastive_loss": 3.957752227783203, - "train/negative_loss": 3.40635085105896, + "train/classification_loss": 0.3626837134361267, + "train/contrastive_loss": 3.458970546722412, + "train/negative_loss": 2.631351947784424, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.5514013767242432, - "train/total_loss": 1.1719611883163452 + "train/num_positives": 14, + "train/positive_loss": 0.8276186585426331, + "train/total_loss": 1.0544778108596802 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3478820025920868, - "train/contrastive_loss": 1.4437536001205444, - "train/negative_loss": 1.351671576499939, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.09208199381828308, - "train/total_loss": 0.6366327404975891 + "train/classification_loss": 0.3533361256122589, + "train/contrastive_loss": 1.8334563970565796, + "train/negative_loss": 1.7719533443450928, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.06150306761264801, + "train/total_loss": 0.7200274467468262 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3342229723930359, - "train/contrastive_loss": 2.277858257293701, - "train/negative_loss": 1.8631938695907593, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.41466444730758667, - "train/total_loss": 0.7897946238517761 + "train/classification_loss": 0.3600704073905945, + "train/contrastive_loss": 3.0222949981689453, + "train/negative_loss": 2.7934417724609375, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.22885310649871826, + "train/total_loss": 0.9645293951034546 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3528163731098175, - "train/contrastive_loss": 4.480205535888672, - "train/negative_loss": 4.342519283294678, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.13768641650676727, - "train/total_loss": 1.2488574981689453 + "train/classification_loss": 0.35269612073898315, + "train/contrastive_loss": 5.173518657684326, + "train/negative_loss": 4.742369174957275, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.4311496615409851, + "train/total_loss": 1.3873999118804932 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3457184433937073, - "train/contrastive_loss": 1.9157134294509888, - "train/negative_loss": 1.8943642377853394, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.021349139511585236, - "train/total_loss": 0.7288610935211182 + "train/classification_loss": 0.38129597902297974, + "train/contrastive_loss": 2.7656726837158203, + "train/negative_loss": 2.366760730743408, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.39891207218170166, + "train/total_loss": 0.9344305396080017 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3252256214618683, - "train/contrastive_loss": 2.622037410736084, - "train/negative_loss": 2.2439162731170654, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.3781212270259857, - "train/total_loss": 0.8496330976486206 + "train/classification_loss": 0.3092501163482666, + "train/contrastive_loss": 2.5747292041778564, + "train/negative_loss": 2.5314383506774902, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.043290793895721436, + "train/total_loss": 0.8241959810256958 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3389511704444885, - "train/contrastive_loss": 1.4268876314163208, - "train/negative_loss": 1.3777763843536377, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.04911124333739281, - "train/total_loss": 0.6243287324905396 + "train/classification_loss": 0.3573189377784729, + "train/contrastive_loss": 2.508971929550171, + "train/negative_loss": 2.380729913711548, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.1282421052455902, + "train/total_loss": 0.859113335609436 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.36392104625701904, - "train/contrastive_loss": 2.2754504680633545, - "train/negative_loss": 1.9995834827423096, - "train/num_negatives": 40, + "train/classification_loss": 0.34687700867652893, + "train/contrastive_loss": 2.098405599594116, + "train/negative_loss": 2.051146984100342, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.2758670747280121, - "train/total_loss": 0.8190111517906189 + "train/positive_loss": 0.047258712351322174, + "train/total_loss": 0.7665581703186035 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3806126117706299, - "train/contrastive_loss": 2.1837809085845947, - "train/negative_loss": 1.5458462238311768, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.6379346251487732, - "train/total_loss": 0.8173688054084778 + "train/classification_loss": 0.35372182726860046, + "train/contrastive_loss": 3.717986583709717, + "train/negative_loss": 3.0732946395874023, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.6446920037269592, + "train/total_loss": 1.0973191261291504 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.376101553440094, - "train/contrastive_loss": 2.319101572036743, - "train/negative_loss": 2.2875003814697266, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.03160123527050018, - "train/total_loss": 0.8399218320846558 + "train/classification_loss": 0.3786483705043793, + "train/contrastive_loss": 2.3159143924713135, + "train/negative_loss": 2.2949910163879395, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.020923269912600517, + "train/total_loss": 0.8418312668800354 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.34527772665023804, - "train/contrastive_loss": 3.263833522796631, - "train/negative_loss": 2.3586740493774414, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.905159592628479, - "train/total_loss": 0.9980444312095642 + "train/classification_loss": 0.3270884156227112, + "train/contrastive_loss": 3.726046323776245, + "train/negative_loss": 3.722228527069092, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.00381774315610528, + "train/total_loss": 1.0722976922988892 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.37274545431137085, - "train/contrastive_loss": 3.119901418685913, - "train/negative_loss": 2.2312264442443848, - "train/num_negatives": 44, + "train/classification_loss": 0.3455738127231598, + "train/contrastive_loss": 1.8412854671478271, + "train/negative_loss": 1.7668914794921875, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.8886749148368835, - "train/total_loss": 0.9967257380485535 + "train/positive_loss": 0.07439402490854263, + "train/total_loss": 0.7138309478759766 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3951014280319214, - "train/contrastive_loss": 2.5472311973571777, - "train/negative_loss": 2.5345542430877686, - "train/num_negatives": 44, + "train/classification_loss": 0.32592976093292236, + "train/contrastive_loss": 2.967134952545166, + "train/negative_loss": 2.961982488632202, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.012677029706537724, - "train/total_loss": 0.9045476913452148 + "train/positive_loss": 0.005152459722012281, + "train/total_loss": 0.9193567633628845 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3374144732952118, - "train/contrastive_loss": 2.064208984375, - "train/negative_loss": 1.3833290338516235, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.6808800101280212, - "train/total_loss": 0.7502562999725342 + "train/classification_loss": 0.36154529452323914, + "train/contrastive_loss": 2.2759153842926025, + "train/negative_loss": 2.2604081630706787, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.01550716906785965, + "train/total_loss": 0.8167283535003662 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.32676494121551514, - "train/contrastive_loss": 1.9432333707809448, - "train/negative_loss": 1.1498665809631348, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.7933667898178101, - "train/total_loss": 0.7154116630554199 + "train/classification_loss": 0.3743017017841339, + "train/contrastive_loss": 2.1762869358062744, + "train/negative_loss": 1.659332513809204, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.5169544219970703, + "train/total_loss": 0.8095591068267822 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3132694959640503, - "train/contrastive_loss": 2.30549955368042, - "train/negative_loss": 2.201972484588623, + "train/classification_loss": 0.3658154010772705, + "train/contrastive_loss": 1.7418978214263916, + "train/negative_loss": 1.726149320602417, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.10352718085050583, - "train/total_loss": 0.7743694186210632 + "train/num_positives": 10, + "train/positive_loss": 0.015748459845781326, + "train/total_loss": 0.7141950130462646 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.37311795353889465, - "train/contrastive_loss": 1.839597225189209, - "train/negative_loss": 0.8937833309173584, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 0.9458138346672058, - "train/total_loss": 0.7410373687744141 + "train/classification_loss": 0.34862056374549866, + "train/contrastive_loss": 3.6049418449401855, + "train/negative_loss": 2.9295573234558105, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.6753845810890198, + "train/total_loss": 1.0696089267730713 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3552400767803192, - "train/contrastive_loss": 1.8420398235321045, - "train/negative_loss": 1.7596285343170166, + "train/classification_loss": 0.362020343542099, + "train/contrastive_loss": 3.104332208633423, + "train/negative_loss": 3.068046808242798, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.08241124451160431, - "train/total_loss": 0.7236480712890625 + "train/num_positives": 4, + "train/positive_loss": 0.03628542274236679, + "train/total_loss": 0.982886791229248 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.36617812514305115, - "train/contrastive_loss": 2.9383108615875244, - "train/negative_loss": 2.6128246784210205, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.3254861831665039, - "train/total_loss": 0.9538402557373047 + "train/classification_loss": 0.3686039447784424, + "train/contrastive_loss": 2.305522918701172, + "train/negative_loss": 2.166105270385742, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.13941775262355804, + "train/total_loss": 0.8297085762023926 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.36349165439605713, - "train/contrastive_loss": 2.1111233234405518, - "train/negative_loss": 2.093932867050171, - "train/num_negatives": 40, + "train/classification_loss": 0.3441305160522461, + "train/contrastive_loss": 3.7442047595977783, + "train/negative_loss": 3.075505495071411, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.017190534621477127, - "train/total_loss": 0.7857162952423096 + "train/positive_loss": 0.6686992049217224, + "train/total_loss": 1.0929715633392334 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3745303750038147, - "train/contrastive_loss": 3.0760979652404785, - "train/negative_loss": 2.3487327098846436, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.7273651361465454, - "train/total_loss": 0.9897499680519104 + "train/classification_loss": 0.3799186050891876, + "train/contrastive_loss": 2.24226713180542, + "train/negative_loss": 1.9748241901397705, + "train/num_negatives": 38, + "train/num_positives": 10, + "train/positive_loss": 0.2674430012702942, + "train/total_loss": 0.8283720016479492 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.36574727296829224, - "train/contrastive_loss": 1.9255603551864624, - "train/negative_loss": 1.6207795143127441, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.3047808110713959, - "train/total_loss": 0.7508593797683716 + "train/classification_loss": 0.3319740891456604, + "train/contrastive_loss": 2.5897202491760254, + "train/negative_loss": 2.5885169506073, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.0012032873928546906, + "train/total_loss": 0.8499181270599365 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3506954312324524, - "train/contrastive_loss": 2.3875203132629395, - "train/negative_loss": 2.254537582397461, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.1329827457666397, - "train/total_loss": 0.8281995058059692 + "train/classification_loss": 0.34652575850486755, + "train/contrastive_loss": 3.9046382904052734, + "train/negative_loss": 3.165811538696289, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.7388266921043396, + "train/total_loss": 1.1274534463882446 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3917487561702728, - "train/contrastive_loss": 2.3338468074798584, - "train/negative_loss": 2.332268238067627, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.001578622730448842, - "train/total_loss": 0.858518123626709 + "train/classification_loss": 0.3571394085884094, + "train/contrastive_loss": 3.291074514389038, + "train/negative_loss": 3.213367223739624, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.07770735025405884, + "train/total_loss": 1.0153543949127197 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3679038882255554, - "train/contrastive_loss": 2.6831815242767334, - "train/negative_loss": 1.4780232906341553, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 1.2051582336425781, - "train/total_loss": 0.9045401811599731 + "train/classification_loss": 0.37590229511260986, + "train/contrastive_loss": 2.5141170024871826, + "train/negative_loss": 2.1928822994232178, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.3212346136569977, + "train/total_loss": 0.8787257075309753 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3481193780899048, - "train/contrastive_loss": 3.8094840049743652, - "train/negative_loss": 3.0918545722961426, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.7176293134689331, - "train/total_loss": 1.110016107559204 + "train/classification_loss": 0.38263601064682007, + "train/contrastive_loss": 2.3549444675445557, + "train/negative_loss": 2.1411330699920654, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.21381144225597382, + "train/total_loss": 0.8536249399185181 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.33463940024375916, - "train/contrastive_loss": 5.6635589599609375, - "train/negative_loss": 2.9082088470458984, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 2.755350112915039, - "train/total_loss": 1.4673511981964111 + "train/classification_loss": 0.3225128948688507, + "train/contrastive_loss": 2.863142728805542, + "train/negative_loss": 2.797741651535034, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.06540101021528244, + "train/total_loss": 0.8951414823532104 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.34790828824043274, - "train/contrastive_loss": 3.577874183654785, - "train/negative_loss": 3.271744966506958, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.30612912774086, - "train/total_loss": 1.0634831190109253 + "train/classification_loss": 0.3632167875766754, + "train/contrastive_loss": 2.3178040981292725, + "train/negative_loss": 2.260415554046631, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 0.05738852918148041, + "train/total_loss": 0.8267775774002075 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.34405311942100525, - "train/contrastive_loss": 2.6842496395111084, - "train/negative_loss": 2.1029293537139893, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.5813202857971191, - "train/total_loss": 0.8809030055999756 + "train/classification_loss": 0.40489381551742554, + "train/contrastive_loss": 3.3704092502593994, + "train/negative_loss": 3.349266529083252, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.02114260569214821, + "train/total_loss": 1.0789756774902344 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.36204737424850464, - "train/contrastive_loss": 2.374380350112915, - "train/negative_loss": 2.369652271270752, - "train/num_negatives": 46, + "train/classification_loss": 0.3605867326259613, + "train/contrastive_loss": 1.298163890838623, + "train/negative_loss": 1.2663718461990356, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.03179203346371651, + "train/total_loss": 0.6202195286750793 + }, + { + "epoch": 0.704225352112676, + "step": 200, + "train/classification_loss": 0.36784157156944275, + "train/contrastive_loss": 2.1754696369171143, + "train/negative_loss": 2.11150860786438, + "train/num_negatives": 42, "train/num_positives": 8, - "train/positive_loss": 0.004728042520582676, - "train/total_loss": 0.8369234800338745 + "train/positive_loss": 0.0639609694480896, + "train/total_loss": 0.8029354810714722 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3510177433490753, - "train/contrastive_loss": 2.354527235031128, - "train/negative_loss": 2.3529369831085205, + "train/classification_loss": 0.324373334646225, + "train/contrastive_loss": 1.6347603797912598, + "train/negative_loss": 1.5759810209274292, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.0015902043087407947, - "train/total_loss": 0.8219231963157654 + "train/num_positives": 10, + "train/positive_loss": 0.05877934768795967, + "train/total_loss": 0.6513254046440125 + }, + { + "epoch": 0.704225352112676, + "step": 200, + "train/classification_loss": 0.3359071612358093, + "train/contrastive_loss": 3.9236061573028564, + "train/negative_loss": 3.7024834156036377, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.22112280130386353, + "train/total_loss": 1.1206283569335938 + }, + { + "epoch": 0.704225352112676, + "step": 200, + "train/classification_loss": 0.38063234090805054, + "train/contrastive_loss": 1.5380961894989014, + "train/negative_loss": 1.5096781253814697, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.02841809019446373, + "train/total_loss": 0.6882516145706177 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3419603407382965, - "train/contrastive_loss": 1.7020747661590576, - "train/negative_loss": 1.6635327339172363, + "train/classification_loss": 0.35039278864860535, + "train/contrastive_loss": 2.1888599395751953, + "train/negative_loss": 2.157989263534546, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.03854206204414368, - "train/total_loss": 0.6823753118515015 + "train/positive_loss": 0.03087073564529419, + "train/total_loss": 0.7881647944450378 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.34513160586357117, - "train/contrastive_loss": 1.8975372314453125, - "train/negative_loss": 1.8852378129959106, - "train/num_negatives": 36, + "train/classification_loss": 0.3656606674194336, + "train/contrastive_loss": 2.470716714859009, + "train/negative_loss": 2.41229248046875, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.05842426419258118, + "train/total_loss": 0.8598040342330933 + }, + { + "epoch": 0.704225352112676, + "step": 200, + "train/classification_loss": 0.38602688908576965, + "train/contrastive_loss": 3.937988758087158, + "train/negative_loss": 3.6602749824523926, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.012299465015530586, - "train/total_loss": 0.7246390581130981 + "train/positive_loss": 0.2777137756347656, + "train/total_loss": 1.1736246347427368 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.368398517370224, - "train/contrastive_loss": 2.7965428829193115, - "train/negative_loss": 2.616300344467163, + "train/classification_loss": 0.3479618430137634, + "train/contrastive_loss": 3.955038547515869, + "train/negative_loss": 2.2126057147979736, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.7424328327178955, + "train/total_loss": 1.1389695405960083 + }, + { + "epoch": 0.704225352112676, + "step": 200, + "train/classification_loss": 0.35680314898490906, + "train/contrastive_loss": 2.5151901245117188, + "train/negative_loss": 2.3891406059265137, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.18024246394634247, - "train/total_loss": 0.9277070760726929 + "train/num_positives": 14, + "train/positive_loss": 0.12604950368404388, + "train/total_loss": 0.8598412275314331 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3396446704864502, - "train/contrastive_loss": 3.2021076679229736, - "train/negative_loss": 2.78757381439209, + "train/classification_loss": 0.37067681550979614, + "train/contrastive_loss": 3.4200215339660645, + "train/negative_loss": 3.37809419631958, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.41453391313552856, - "train/total_loss": 0.9800662398338318 + "train/num_positives": 2, + "train/positive_loss": 0.04192742332816124, + "train/total_loss": 1.0546810626983643 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.33377429842948914, - "train/contrastive_loss": 1.4925134181976318, - "train/negative_loss": 1.347885012626648, + "train/classification_loss": 0.3493765592575073, + "train/contrastive_loss": 2.4909698963165283, + "train/negative_loss": 2.1821136474609375, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.1446283459663391, - "train/total_loss": 0.6322770118713379 + "train/num_positives": 16, + "train/positive_loss": 0.3088562786579132, + "train/total_loss": 0.847570538520813 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3873163163661957, - "train/contrastive_loss": 2.383845090866089, - "train/negative_loss": 2.329446315765381, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.05439874529838562, - "train/total_loss": 0.86408531665802 + "train/classification_loss": 0.37985509634017944, + "train/contrastive_loss": 2.908679962158203, + "train/negative_loss": 2.8500924110412598, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.058587461709976196, + "train/total_loss": 0.9615911245346069 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3322080373764038, - "train/contrastive_loss": 1.7163742780685425, - "train/negative_loss": 1.7124805450439453, - "train/num_negatives": 48, + "train/classification_loss": 0.37945207953453064, + "train/contrastive_loss": 2.2139487266540527, + "train/negative_loss": 2.086418867111206, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 0.0038937099743634462, - "train/total_loss": 0.6754828691482544 + "train/positive_loss": 0.1275298297405243, + "train/total_loss": 0.8222418427467346 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.35688260197639465, - "train/contrastive_loss": 1.1968886852264404, - "train/negative_loss": 0.7679566144943237, + "train/classification_loss": 0.3666813373565674, + "train/contrastive_loss": 1.779737949371338, + "train/negative_loss": 1.7209254503250122, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.4289321303367615, - "train/total_loss": 0.5962603092193604 + "train/num_positives": 14, + "train/positive_loss": 0.058812472969293594, + "train/total_loss": 0.7226289510726929 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.33920884132385254, - "train/contrastive_loss": 2.9789772033691406, - "train/negative_loss": 2.847315549850464, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.13166159391403198, - "train/total_loss": 0.9350042939186096 + "train/classification_loss": 0.4065815210342407, + "train/contrastive_loss": 3.4165267944335938, + "train/negative_loss": 3.373825788497925, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 0.04270093888044357, + "train/total_loss": 1.0898869037628174 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.38580480217933655, - "train/contrastive_loss": 1.0609130859375, - "train/negative_loss": 0.8914381265640259, - "train/num_negatives": 28, + "train/classification_loss": 0.33919551968574524, + "train/contrastive_loss": 2.654151439666748, + "train/negative_loss": 2.6463871002197266, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.1694749891757965, - "train/total_loss": 0.5979874134063721 + "train/positive_loss": 0.007764222100377083, + "train/total_loss": 0.8700258731842041 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.36553457379341125, - "train/contrastive_loss": 2.033005952835083, - "train/negative_loss": 1.5298676490783691, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.5031383037567139, - "train/total_loss": 0.7721357345581055 + "train/classification_loss": 0.33839792013168335, + "train/contrastive_loss": 2.9100310802459717, + "train/negative_loss": 2.9021646976470947, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.007866277359426022, + "train/total_loss": 0.9204041361808777 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3414057493209839, - "train/contrastive_loss": 2.2091939449310303, - "train/negative_loss": 2.129155158996582, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.08003868907690048, - "train/total_loss": 0.7832445502281189 + "train/classification_loss": 0.3517836332321167, + "train/contrastive_loss": 2.234933614730835, + "train/negative_loss": 2.2329797744750977, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.0019538896158337593, + "train/total_loss": 0.7987703680992126 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3462255597114563, - "train/contrastive_loss": 2.4438347816467285, - "train/negative_loss": 1.3836157321929932, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.0602190494537354, - "train/total_loss": 0.834992527961731 + "train/classification_loss": 0.36322763562202454, + "train/contrastive_loss": 4.510669708251953, + "train/negative_loss": 2.5318989753723145, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.9787707328796387, + "train/total_loss": 1.2653615474700928 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.34299638867378235, - "train/contrastive_loss": 4.2317376136779785, - "train/negative_loss": 3.805967092514038, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.4257703423500061, - "train/total_loss": 1.1893439292907715 + "train/classification_loss": 0.36761924624443054, + "train/contrastive_loss": 2.8496103286743164, + "train/negative_loss": 2.7521278858184814, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.09748252481222153, + "train/total_loss": 0.9375413656234741 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.35235947370529175, - "train/contrastive_loss": 2.3517916202545166, - "train/negative_loss": 1.865363359451294, + "train/classification_loss": 0.350806325674057, + "train/contrastive_loss": 1.2713918685913086, + "train/negative_loss": 1.189595341682434, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.4864283502101898, - "train/total_loss": 0.8227177858352661 + "train/num_positives": 16, + "train/positive_loss": 0.08179657906293869, + "train/total_loss": 0.6050847172737122 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.33627578616142273, - "train/contrastive_loss": 3.331023693084717, - "train/negative_loss": 3.1072545051574707, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.2237691879272461, - "train/total_loss": 1.0024805068969727 + "train/classification_loss": 0.35948753356933594, + "train/contrastive_loss": 3.549363851547241, + "train/negative_loss": 3.200535535812378, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 0.34882837533950806, + "train/total_loss": 1.0693602561950684 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3738948702812195, - "train/contrastive_loss": 2.950991153717041, - "train/negative_loss": 2.5014560222625732, + "train/classification_loss": 0.3650091290473938, + "train/contrastive_loss": 3.3538875579833984, + "train/negative_loss": 3.3494699001312256, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.4495352506637573, - "train/total_loss": 0.9640930891036987 + "train/num_positives": 2, + "train/positive_loss": 0.00441768579185009, + "train/total_loss": 1.0357866287231445 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3459518551826477, - "train/contrastive_loss": 2.9752302169799805, - "train/negative_loss": 2.963716983795166, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.01151323039084673, - "train/total_loss": 0.9409978985786438 + "train/classification_loss": 0.3346955478191376, + "train/contrastive_loss": 3.4461872577667236, + "train/negative_loss": 3.434870481491089, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.01131683774292469, + "train/total_loss": 1.0239330530166626 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.331338495016098, - "train/contrastive_loss": 2.0834391117095947, - "train/negative_loss": 1.747328281402588, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.3361107409000397, - "train/total_loss": 0.7480263113975525 + "train/classification_loss": 0.35658740997314453, + "train/contrastive_loss": 3.258201837539673, + "train/negative_loss": 3.1837801933288574, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.07442161440849304, + "train/total_loss": 1.008227825164795 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.34600263833999634, - "train/contrastive_loss": 2.091334104537964, - "train/negative_loss": 1.9828624725341797, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.10847169160842896, - "train/total_loss": 0.7642694711685181 + "train/classification_loss": 0.3788551390171051, + "train/contrastive_loss": 4.408748626708984, + "train/negative_loss": 2.54168963432312, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 1.8670587539672852, + "train/total_loss": 1.2606048583984375 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3637847900390625, - "train/contrastive_loss": 2.7883191108703613, - "train/negative_loss": 2.282731771469116, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.5055872201919556, - "train/total_loss": 0.9214486479759216 + "train/classification_loss": 0.3525297939777374, + "train/contrastive_loss": 3.835818290710449, + "train/negative_loss": 3.8349013328552246, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.0009169792756438255, + "train/total_loss": 1.1196935176849365 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3520596921443939, - "train/contrastive_loss": 2.7270517349243164, - "train/negative_loss": 2.436143398284912, + "train/classification_loss": 0.3724968135356903, + "train/contrastive_loss": 1.8083879947662354, + "train/negative_loss": 1.6629879474639893, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.29090824723243713, - "train/total_loss": 0.8974699974060059 + "train/positive_loss": 0.14540009200572968, + "train/total_loss": 0.7341744303703308 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.36030033230781555, - "train/contrastive_loss": 1.451364517211914, - "train/negative_loss": 1.4473069906234741, + "train/classification_loss": 0.3550809919834137, + "train/contrastive_loss": 2.303849458694458, + "train/negative_loss": 2.2234840393066406, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.004057473503053188, - "train/total_loss": 0.6505732536315918 + "train/num_positives": 8, + "train/positive_loss": 0.08036541193723679, + "train/total_loss": 0.8158508539199829 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.32881563901901245, - "train/contrastive_loss": 3.862379312515259, - "train/negative_loss": 3.6684770584106445, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.19390232861042023, - "train/total_loss": 1.101291537284851 + "train/classification_loss": 0.32960572838783264, + "train/contrastive_loss": 3.2862935066223145, + "train/negative_loss": 3.2755134105682373, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.010780061595141888, + "train/total_loss": 0.986864447593689 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.3583086133003235, - "train/contrastive_loss": 2.5388364791870117, - "train/negative_loss": 2.4129137992858887, - "train/num_negatives": 46, + "train/classification_loss": 0.37115204334259033, + "train/contrastive_loss": 2.861098289489746, + "train/negative_loss": 2.4897360801696777, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.1259227693080902, - "train/total_loss": 0.8660759329795837 + "train/positive_loss": 0.3713622987270355, + "train/total_loss": 0.9433717131614685 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.38607850670814514, - "train/contrastive_loss": 1.970755696296692, - "train/negative_loss": 1.970755696296692, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.7802296876907349 + "train/classification_loss": 0.37576794624328613, + "train/contrastive_loss": 2.9777140617370605, + "train/negative_loss": 2.5580532550811768, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.4196608364582062, + "train/total_loss": 0.9713107943534851 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "eval_exact_match_accuracy": 0.0, - "eval_hamming_loss": 0.0984873949579832, - "eval_loss": 0.8576530814170837, - "eval_macro_f1": 0.0, - "eval_macro_precision": 0.0, - "eval_macro_recall": 0.0, - "eval_micro_f1": 0.0, - "eval_micro_precision": 0.0, - "eval_micro_recall": 0.0, - "eval_runtime": 2.5751, - "eval_samples_per_second": 203.875, - "eval_steps_per_second": 25.63, + "eval_hamming_loss": 0.09720925407199917, + "eval_loss": 0.9205195307731628, + "eval_macro_f1": 0.0006033182503770739, + "eval_macro_precision": 0.058823529411764705, + "eval_macro_recall": 0.00030321406913280777, + "eval_micro_f1": 0.002129925452609159, + "eval_micro_precision": 1.0, + "eval_micro_recall": 0.0010660980810234541, + "eval_runtime": 2.8545, + "eval_samples_per_second": 198.633, + "eval_steps_per_second": 24.873, "step": 200 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.39491283893585205, - "train/contrastive_loss": 2.230945587158203, - "train/negative_loss": 1.4184013605117798, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.8125442862510681, - "train/total_loss": 0.8411020040512085 + "train/classification_loss": 0.3534598648548126, + "train/contrastive_loss": 1.6415746212005615, + "train/negative_loss": 1.2293429374694824, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.4122316539287567, + "train/total_loss": 0.6817747950553894 }, { - "epoch": 0.7604562737642585, + "epoch": 0.704225352112676, "step": 200, - "train/classification_loss": 0.35897472500801086, - "train/contrastive_loss": 1.6095407009124756, - "train/negative_loss": 1.0223037004470825, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.5872370004653931, - "train/total_loss": 0.6808828711509705 + "train/classification_loss": 0.3670371174812317, + "train/contrastive_loss": 1.2740015983581543, + "train/negative_loss": 0.9414844512939453, + "train/num_negatives": 46, + "train/num_positives": 10, + "train/positive_loss": 0.33251717686653137, + "train/total_loss": 0.6218374371528625 }, { - "epoch": 0.9505703422053232, - "grad_norm": 21.209495544433594, - "learning_rate": 1.9977625570776257e-05, - "loss": 1.3557, + "epoch": 0.8802816901408451, + "grad_norm": 17.732545852661133, + "learning_rate": 1.997928118393235e-05, + "loss": 1.3539, "step": 250 }, { - "epoch": 0.9505703422053232, + "epoch": 0.8802816901408451, "step": 250, - "train/classification_loss": 0.31806451082229614, - "train/contrastive_loss": 1.6106826066970825, - "train/negative_loss": 1.1766853332519531, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.4339972734451294, - "train/total_loss": 0.6402010321617126 + "train/classification_loss": 0.3377353549003601, + "train/contrastive_loss": 2.0764522552490234, + "train/negative_loss": 1.2744636535644531, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.8019887208938599, + "train/total_loss": 0.7530257701873779 }, { - "epoch": 0.9505703422053232, + "epoch": 0.8802816901408451, "step": 250, - "train/classification_loss": 0.2628883421421051, - "train/contrastive_loss": 1.5048027038574219, - "train/negative_loss": 1.4083112478256226, - "train/num_negatives": 24, - "train/num_positives": 32, - "train/positive_loss": 0.09649147093296051, - "train/total_loss": 0.5638488531112671 + "train/classification_loss": 0.3293566405773163, + "train/contrastive_loss": 2.125258445739746, + "train/negative_loss": 1.2052654027938843, + "train/num_negatives": 30, + "train/num_positives": 12, + "train/positive_loss": 0.9199931621551514, + "train/total_loss": 0.7544083595275879 }, { - "epoch": 1.1406844106463878, - "grad_norm": 16.87105941772461, - "learning_rate": 1.9970015220700155e-05, - "loss": 1.261, + "epoch": 1.056338028169014, + "grad_norm": 20.307628631591797, + "learning_rate": 1.9972233967582807e-05, + "loss": 1.2688, "step": 300 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.3311900496482849, - "train/contrastive_loss": 2.5159664154052734, - "train/negative_loss": 1.703377604484558, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.8125887513160706, - "train/total_loss": 0.8343833684921265 + "train/classification_loss": 0.30594518780708313, + "train/contrastive_loss": 2.4988250732421875, + "train/negative_loss": 2.49473237991333, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.004092785529792309, + "train/total_loss": 0.8057101964950562 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.30819466710090637, - "train/contrastive_loss": 3.584254503250122, - "train/negative_loss": 3.1056554317474365, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.47859910130500793, - "train/total_loss": 1.02504563331604 + "train/classification_loss": 0.36961638927459717, + "train/contrastive_loss": 2.229480028152466, + "train/negative_loss": 2.1767866611480713, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.05269325524568558, + "train/total_loss": 0.8155124187469482 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.2846865952014923, - "train/contrastive_loss": 3.214858055114746, - "train/negative_loss": 2.0745797157287598, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.1402784585952759, - "train/total_loss": 0.927658200263977 + "train/classification_loss": 0.31562164425849915, + "train/contrastive_loss": 3.3603179454803467, + "train/negative_loss": 2.18591570854187, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.1744022369384766, + "train/total_loss": 0.9876852035522461 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.28454238176345825, - "train/contrastive_loss": 2.6428890228271484, - "train/negative_loss": 1.922734022140503, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.7201549410820007, - "train/total_loss": 0.8131201863288879 + "train/classification_loss": 0.260353684425354, + "train/contrastive_loss": 2.384992837905884, + "train/negative_loss": 2.353367567062378, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.03162530064582825, + "train/total_loss": 0.7373522520065308 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.3244551122188568, - "train/contrastive_loss": 1.6570758819580078, - "train/negative_loss": 1.3382107019424438, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.3188651204109192, - "train/total_loss": 0.6558703184127808 + "train/classification_loss": 0.29958847165107727, + "train/contrastive_loss": 3.18422269821167, + "train/negative_loss": 3.019544839859009, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.1646779477596283, + "train/total_loss": 0.9364330768585205 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.30504703521728516, - "train/contrastive_loss": 2.757450580596924, - "train/negative_loss": 2.4901654720306396, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.26728522777557373, - "train/total_loss": 0.8565371632575989 + "train/classification_loss": 0.30007806420326233, + "train/contrastive_loss": 3.0554862022399902, + "train/negative_loss": 2.2332777976989746, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.8222082853317261, + "train/total_loss": 0.9111753702163696 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.3390626907348633, - "train/contrastive_loss": 2.825791358947754, - "train/negative_loss": 2.700735569000244, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.12505587935447693, - "train/total_loss": 0.9042209982872009 + "train/classification_loss": 0.29807448387145996, + "train/contrastive_loss": 2.0360546112060547, + "train/negative_loss": 1.878265380859375, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.15778911113739014, + "train/total_loss": 0.7052854299545288 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.25914135575294495, - "train/contrastive_loss": 2.4474306106567383, - "train/negative_loss": 2.0465307235717773, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.4008999466896057, - "train/total_loss": 0.7486274838447571 + "train/classification_loss": 0.33394795656204224, + "train/contrastive_loss": 1.64840829372406, + "train/negative_loss": 1.6481661796569824, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 0.00024208375543821603, + "train/total_loss": 0.6636296510696411 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.27669984102249146, - "train/contrastive_loss": 2.2188913822174072, - "train/negative_loss": 2.215890407562256, + "train/classification_loss": 0.31289201974868774, + "train/contrastive_loss": 1.3649917840957642, + "train/negative_loss": 1.2146955728530884, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.003001060802489519, - "train/total_loss": 0.7204781174659729 + "train/positive_loss": 0.1502961814403534, + "train/total_loss": 0.5858904123306274 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.3379654884338379, - "train/contrastive_loss": 4.418155670166016, - "train/negative_loss": 3.475825309753418, + "train/classification_loss": 0.31317582726478577, + "train/contrastive_loss": 3.554135799407959, + "train/negative_loss": 2.103843927383423, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.9423301219940186, - "train/total_loss": 1.2215967178344727 + "train/num_positives": 14, + "train/positive_loss": 1.4502917528152466, + "train/total_loss": 1.024003028869629 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.2915635406970978, - "train/contrastive_loss": 2.3736963272094727, - "train/negative_loss": 2.2806899547576904, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.09300631284713745, - "train/total_loss": 0.7663028240203857 + "train/classification_loss": 0.2947699725627899, + "train/contrastive_loss": 2.4679057598114014, + "train/negative_loss": 2.399268865585327, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.06863680481910706, + "train/total_loss": 0.7883511185646057 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.2719399034976959, - "train/contrastive_loss": 2.558049201965332, - "train/negative_loss": 2.4975368976593018, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.060512199997901917, - "train/total_loss": 0.7835497856140137 + "train/classification_loss": 0.31243011355400085, + "train/contrastive_loss": 1.931992530822754, + "train/negative_loss": 1.9139418601989746, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.018050648272037506, + "train/total_loss": 0.6988286375999451 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.3022117018699646, - "train/contrastive_loss": 3.82729172706604, - "train/negative_loss": 3.3631398677825928, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.46415194869041443, - "train/total_loss": 1.0676701068878174 + "train/classification_loss": 0.29993221163749695, + "train/contrastive_loss": 5.04127836227417, + "train/negative_loss": 3.258833646774292, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.7824445962905884, + "train/total_loss": 1.3081879615783691 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.2861654758453369, - "train/contrastive_loss": 2.0566952228546143, - "train/negative_loss": 2.0304324626922607, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.026262715458869934, - "train/total_loss": 0.6975045204162598 + "train/classification_loss": 0.3398338258266449, + "train/contrastive_loss": 4.088870048522949, + "train/negative_loss": 1.8648176193237305, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 2.224052667617798, + "train/total_loss": 1.1576077938079834 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.2622973918914795, - "train/contrastive_loss": 2.8588292598724365, - "train/negative_loss": 2.8344078063964844, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.024421511217951775, - "train/total_loss": 0.8340632319450378 + "train/classification_loss": 0.24651873111724854, + "train/contrastive_loss": 2.714564085006714, + "train/negative_loss": 2.345625638961792, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.3689383864402771, + "train/total_loss": 0.7894315719604492 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.2802102863788605, - "train/contrastive_loss": 1.7099977731704712, - "train/negative_loss": 1.510746717453003, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.19925101101398468, - "train/total_loss": 0.6222098469734192 + "train/classification_loss": 0.3147347569465637, + "train/contrastive_loss": 3.5181074142456055, + "train/negative_loss": 2.768947124481201, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.7491604089736938, + "train/total_loss": 1.0183563232421875 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.31750431656837463, - "train/contrastive_loss": 2.2720117568969727, - "train/negative_loss": 2.0746233463287354, - "train/num_negatives": 40, + "train/classification_loss": 0.2947418987751007, + "train/contrastive_loss": 2.9206302165985107, + "train/negative_loss": 2.7699949741363525, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.19738835096359253, - "train/total_loss": 0.7719066739082336 + "train/positive_loss": 0.15063515305519104, + "train/total_loss": 0.8788679838180542 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.34297657012939453, - "train/contrastive_loss": 2.1303646564483643, - "train/negative_loss": 1.8917371034622192, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.2386276125907898, - "train/total_loss": 0.7690495252609253 + "train/classification_loss": 0.3061610758304596, + "train/contrastive_loss": 3.530163288116455, + "train/negative_loss": 3.253753185272217, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.27641019225120544, + "train/total_loss": 1.0121937990188599 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.3348046839237213, - "train/contrastive_loss": 1.864820122718811, - "train/negative_loss": 1.8440401554107666, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.020779980346560478, - "train/total_loss": 0.7077686786651611 + "train/classification_loss": 0.3312360644340515, + "train/contrastive_loss": 1.7040787935256958, + "train/negative_loss": 1.6804348230361938, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.02364397421479225, + "train/total_loss": 0.6720517873764038 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.2850024998188019, - "train/contrastive_loss": 3.6059298515319824, - "train/negative_loss": 3.3557891845703125, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.2501407861709595, - "train/total_loss": 1.0061885118484497 + "train/classification_loss": 0.26763319969177246, + "train/contrastive_loss": 2.2348668575286865, + "train/negative_loss": 2.1961047649383545, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.03876205533742905, + "train/total_loss": 0.7146065831184387 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.32808980345726013, - "train/contrastive_loss": 3.323831796646118, - "train/negative_loss": 2.5689518451690674, - "train/num_negatives": 44, + "train/classification_loss": 0.28071412444114685, + "train/contrastive_loss": 1.3188576698303223, + "train/negative_loss": 1.1333078145980835, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.7548799514770508, - "train/total_loss": 0.9928561449050903 + "train/positive_loss": 0.185549795627594, + "train/total_loss": 0.5444856882095337 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.34635129570961, - "train/contrastive_loss": 3.302574872970581, - "train/negative_loss": 3.3003475666046143, - "train/num_negatives": 44, + "train/classification_loss": 0.2643817067146301, + "train/contrastive_loss": 3.064574718475342, + "train/negative_loss": 2.9858994483947754, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.002227221382781863, - "train/total_loss": 1.0068663358688354 + "train/positive_loss": 0.07867515087127686, + "train/total_loss": 0.8772966861724854 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.27829480171203613, - "train/contrastive_loss": 2.382777690887451, - "train/negative_loss": 1.770250678062439, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.6125270128250122, - "train/total_loss": 0.7548503875732422 + "train/classification_loss": 0.3155921697616577, + "train/contrastive_loss": 2.911530017852783, + "train/negative_loss": 1.8282358646392822, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 1.0832940340042114, + "train/total_loss": 0.8978981971740723 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.2630482316017151, - "train/contrastive_loss": 1.7943289279937744, - "train/negative_loss": 1.6165958642959595, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.17773304879665375, - "train/total_loss": 0.6219140291213989 + "train/classification_loss": 0.33588844537734985, + "train/contrastive_loss": 2.692957639694214, + "train/negative_loss": 1.6892998218536377, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.0036578178405762, + "train/total_loss": 0.8744800090789795 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.24599485099315643, - "train/contrastive_loss": 2.8403139114379883, - "train/negative_loss": 2.8199398517608643, + "train/classification_loss": 0.3198592960834503, + "train/contrastive_loss": 2.034044027328491, + "train/negative_loss": 1.768754243850708, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.020373957231640816, - "train/total_loss": 0.8140576481819153 + "train/num_positives": 10, + "train/positive_loss": 0.26528987288475037, + "train/total_loss": 0.726668119430542 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.3282795548439026, - "train/contrastive_loss": 1.3518707752227783, - "train/negative_loss": 0.49805206060409546, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 0.8538186550140381, - "train/total_loss": 0.5986536741256714 + "train/classification_loss": 0.29373568296432495, + "train/contrastive_loss": 3.501856803894043, + "train/negative_loss": 2.3817152976989746, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.1201415061950684, + "train/total_loss": 0.9941070675849915 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.30935174226760864, - "train/contrastive_loss": 2.9191884994506836, - "train/negative_loss": 2.911905527114868, + "train/classification_loss": 0.31500720977783203, + "train/contrastive_loss": 2.423717498779297, + "train/negative_loss": 2.421290636062622, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.007282879203557968, - "train/total_loss": 0.8931894302368164 + "train/num_positives": 4, + "train/positive_loss": 0.0024269737768918276, + "train/total_loss": 0.7997506856918335 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.31560975313186646, - "train/contrastive_loss": 3.381509780883789, - "train/negative_loss": 2.6018850803375244, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.7796245813369751, - "train/total_loss": 0.9919117093086243 + "train/classification_loss": 0.3181622326374054, + "train/contrastive_loss": 1.0337097644805908, + "train/negative_loss": 1.0289721488952637, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.004737657494843006, + "train/total_loss": 0.524904191493988 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.3167814314365387, - "train/contrastive_loss": 2.4855895042419434, - "train/negative_loss": 2.338549852371216, - "train/num_negatives": 40, + "train/classification_loss": 0.2979702651500702, + "train/contrastive_loss": 3.610692024230957, + "train/negative_loss": 1.9066754579544067, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.14703965187072754, - "train/total_loss": 0.8138993382453918 + "train/positive_loss": 1.7040166854858398, + "train/total_loss": 1.020108699798584 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.3307754099369049, - "train/contrastive_loss": 4.296078681945801, - "train/negative_loss": 3.510606050491333, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.7854723930358887, - "train/total_loss": 1.1899911165237427 + "train/classification_loss": 0.3428727984428406, + "train/contrastive_loss": 1.9881088733673096, + "train/negative_loss": 1.655469536781311, + "train/num_negatives": 38, + "train/num_positives": 10, + "train/positive_loss": 0.3326393663883209, + "train/total_loss": 0.7404946088790894 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.31434470415115356, - "train/contrastive_loss": 2.28171443939209, - "train/negative_loss": 1.5652763843536377, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.7164381742477417, - "train/total_loss": 0.7706875801086426 + "train/classification_loss": 0.2712554633617401, + "train/contrastive_loss": 2.010617256164551, + "train/negative_loss": 2.006277561187744, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.004339645616710186, + "train/total_loss": 0.6733789443969727 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.29842182993888855, - "train/contrastive_loss": 3.1961498260498047, - "train/negative_loss": 3.0817878246307373, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.11436188220977783, - "train/total_loss": 0.9376517534255981 + "train/classification_loss": 0.2919139266014099, + "train/contrastive_loss": 4.656617641448975, + "train/negative_loss": 3.2068932056427, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.449724555015564, + "train/total_loss": 1.2232375144958496 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.3545219898223877, - "train/contrastive_loss": 2.49855899810791, - "train/negative_loss": 2.498236894607544, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0003221553924959153, - "train/total_loss": 0.8542338013648987 + "train/classification_loss": 0.3088808059692383, + "train/contrastive_loss": 3.0035738945007324, + "train/negative_loss": 2.2147040367126465, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.7888697385787964, + "train/total_loss": 0.9095956087112427 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.3203617036342621, - "train/contrastive_loss": 2.355663776397705, - "train/negative_loss": 2.1532628536224365, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.20240084826946259, - "train/total_loss": 0.7914944887161255 + "train/classification_loss": 0.3173966109752655, + "train/contrastive_loss": 2.497237205505371, + "train/negative_loss": 1.6290912628173828, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.8681459426879883, + "train/total_loss": 0.8168440461158752 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.29627981781959534, - "train/contrastive_loss": 4.059073448181152, - "train/negative_loss": 2.9663538932800293, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.0927194356918335, - "train/total_loss": 1.108094573020935 + "train/classification_loss": 0.33909109234809875, + "train/contrastive_loss": 3.077838897705078, + "train/negative_loss": 2.4171860218048096, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.6606528162956238, + "train/total_loss": 0.9546588659286499 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.2795562744140625, - "train/contrastive_loss": 6.9291276931762695, - "train/negative_loss": 3.5817205905914307, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 3.3474068641662598, - "train/total_loss": 1.6653817892074585 + "train/classification_loss": 0.26384925842285156, + "train/contrastive_loss": 3.8524835109710693, + "train/negative_loss": 3.6561694145202637, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.1963140368461609, + "train/total_loss": 1.0343459844589233 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.29684361815452576, - "train/contrastive_loss": 3.758542060852051, - "train/negative_loss": 3.272798538208008, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.4857436418533325, - "train/total_loss": 1.0485520362854004 + "train/classification_loss": 0.3107200562953949, + "train/contrastive_loss": 2.201188087463379, + "train/negative_loss": 1.7593269348144531, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 0.4418611526489258, + "train/total_loss": 0.7509576678276062 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.2857086956501007, - "train/contrastive_loss": 2.5368218421936035, - "train/negative_loss": 2.3057985305786133, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.23102323710918427, - "train/total_loss": 0.7930730581283569 + "train/classification_loss": 0.3748219311237335, + "train/contrastive_loss": 4.88300085067749, + "train/negative_loss": 4.8675031661987305, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.015497865155339241, + "train/total_loss": 1.3514220714569092 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.31555646657943726, - "train/contrastive_loss": 2.501011610031128, - "train/negative_loss": 2.4832587242126465, - "train/num_negatives": 46, + "train/classification_loss": 0.3118785619735718, + "train/contrastive_loss": 1.8053268194198608, + "train/negative_loss": 1.709904670715332, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.0954221561551094, + "train/total_loss": 0.6729439496994019 + }, + { + "epoch": 1.056338028169014, + "step": 300, + "train/classification_loss": 0.32360708713531494, + "train/contrastive_loss": 3.670279026031494, + "train/negative_loss": 3.0591373443603516, + "train/num_negatives": 42, "train/num_positives": 8, - "train/positive_loss": 0.017752807587385178, - "train/total_loss": 0.8157588243484497 + "train/positive_loss": 0.611141562461853, + "train/total_loss": 1.0576629638671875 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.3001801669597626, - "train/contrastive_loss": 3.2040703296661377, - "train/negative_loss": 3.2038421630859375, + "train/classification_loss": 0.26719018816947937, + "train/contrastive_loss": 1.7779717445373535, + "train/negative_loss": 1.552098035812378, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.00022825223277322948, - "train/total_loss": 0.9409942626953125 + "train/num_positives": 10, + "train/positive_loss": 0.22587375342845917, + "train/total_loss": 0.6227845549583435 + }, + { + "epoch": 1.056338028169014, + "step": 300, + "train/classification_loss": 0.27464035153388977, + "train/contrastive_loss": 4.823848724365234, + "train/negative_loss": 4.2317962646484375, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.5920522809028625, + "train/total_loss": 1.239410161972046 + }, + { + "epoch": 1.056338028169014, + "step": 300, + "train/classification_loss": 0.3322891294956207, + "train/contrastive_loss": 2.0012426376342773, + "train/negative_loss": 1.9953967332839966, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.005845996551215649, + "train/total_loss": 0.7325376272201538 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.28472691774368286, - "train/contrastive_loss": 1.7473807334899902, - "train/negative_loss": 1.743579626083374, + "train/classification_loss": 0.3042404353618622, + "train/contrastive_loss": 3.341874122619629, + "train/negative_loss": 3.3319761753082275, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.0038010524585843086, - "train/total_loss": 0.6342030763626099 + "train/positive_loss": 0.009897973388433456, + "train/total_loss": 0.9726152420043945 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.2894015610218048, - "train/contrastive_loss": 2.797426462173462, - "train/negative_loss": 2.7002365589141846, - "train/num_negatives": 36, + "train/classification_loss": 0.3163105547428131, + "train/contrastive_loss": 2.1025753021240234, + "train/negative_loss": 1.6227657794952393, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.47980961203575134, + "train/total_loss": 0.7368255853652954 + }, + { + "epoch": 1.056338028169014, + "step": 300, + "train/classification_loss": 0.35113173723220825, + "train/contrastive_loss": 3.732910633087158, + "train/negative_loss": 3.2763113975524902, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.09718982875347137, - "train/total_loss": 0.8488868474960327 + "train/positive_loss": 0.45659929513931274, + "train/total_loss": 1.0977139472961426 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.32310640811920166, - "train/contrastive_loss": 3.3808000087738037, - "train/negative_loss": 3.3086330890655518, + "train/classification_loss": 0.28845012187957764, + "train/contrastive_loss": 2.3967533111572266, + "train/negative_loss": 1.6205039024353027, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.7762492895126343, + "train/total_loss": 0.7678008079528809 + }, + { + "epoch": 1.056338028169014, + "step": 300, + "train/classification_loss": 0.311286598443985, + "train/contrastive_loss": 2.243960380554199, + "train/negative_loss": 1.697359561920166, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.07216700911521912, - "train/total_loss": 0.9992664456367493 + "train/num_positives": 14, + "train/positive_loss": 0.5466007590293884, + "train/total_loss": 0.7600786685943604 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.2838151752948761, - "train/contrastive_loss": 3.739941358566284, - "train/negative_loss": 3.266683578491211, + "train/classification_loss": 0.329230934381485, + "train/contrastive_loss": 2.6925671100616455, + "train/negative_loss": 2.6917529106140137, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.47325778007507324, - "train/total_loss": 1.0318034887313843 + "train/num_positives": 2, + "train/positive_loss": 0.0008141135331243277, + "train/total_loss": 0.8677443265914917 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.2764193117618561, - "train/contrastive_loss": 1.8691608905792236, - "train/negative_loss": 1.6223363876342773, + "train/classification_loss": 0.2909841537475586, + "train/contrastive_loss": 2.3947298526763916, + "train/negative_loss": 1.6677296161651611, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.2468244433403015, - "train/total_loss": 0.6502515077590942 + "train/num_positives": 16, + "train/positive_loss": 0.7270002365112305, + "train/total_loss": 0.7699301242828369 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.3486481308937073, - "train/contrastive_loss": 2.6942453384399414, - "train/negative_loss": 2.576687812805176, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.11755752563476562, - "train/total_loss": 0.8874971866607666 + "train/classification_loss": 0.3502001464366913, + "train/contrastive_loss": 3.011383056640625, + "train/negative_loss": 2.275353193283081, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.736029863357544, + "train/total_loss": 0.9524767398834229 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.26995208859443665, - "train/contrastive_loss": 2.3868443965911865, - "train/negative_loss": 2.3861751556396484, - "train/num_negatives": 48, + "train/classification_loss": 0.3382168710231781, + "train/contrastive_loss": 1.9932276010513306, + "train/negative_loss": 1.863538384437561, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 0.0006692271563224494, - "train/total_loss": 0.7473210096359253 + "train/positive_loss": 0.12968920171260834, + "train/total_loss": 0.7368624210357666 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.30062615871429443, - "train/contrastive_loss": 1.4550412893295288, - "train/negative_loss": 1.2852600812911987, + "train/classification_loss": 0.31939324736595154, + "train/contrastive_loss": 1.3574552536010742, + "train/negative_loss": 1.290783166885376, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.16978125274181366, - "train/total_loss": 0.5916343927383423 + "train/num_positives": 14, + "train/positive_loss": 0.06667205691337585, + "train/total_loss": 0.5908843278884888 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.28400516510009766, - "train/contrastive_loss": 3.97418212890625, - "train/negative_loss": 3.9725892543792725, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.0015928089851513505, - "train/total_loss": 1.0788416862487793 + "train/classification_loss": 0.37328213453292847, + "train/contrastive_loss": 2.9023702144622803, + "train/negative_loss": 2.844270706176758, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 0.05809956043958664, + "train/total_loss": 0.9537562131881714 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.34289854764938354, - "train/contrastive_loss": 0.8920086026191711, - "train/negative_loss": 0.8704383373260498, - "train/num_negatives": 28, + "train/classification_loss": 0.284429669380188, + "train/contrastive_loss": 2.50447678565979, + "train/negative_loss": 2.5031793117523193, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.02157028578221798, - "train/total_loss": 0.5213002562522888 + "train/positive_loss": 0.0012975239660590887, + "train/total_loss": 0.7853250503540039 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.31150728464126587, - "train/contrastive_loss": 3.3335628509521484, - "train/negative_loss": 2.4695451259613037, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.8640177845954895, - "train/total_loss": 0.9782198667526245 + "train/classification_loss": 0.28343111276626587, + "train/contrastive_loss": 2.2238190174102783, + "train/negative_loss": 2.1554484367370605, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.06837065517902374, + "train/total_loss": 0.7281949520111084 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.28393611311912537, - "train/contrastive_loss": 2.801198720932007, - "train/negative_loss": 2.7939453125, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.007253373973071575, - "train/total_loss": 0.8441758155822754 + "train/classification_loss": 0.3072069585323334, + "train/contrastive_loss": 2.5616800785064697, + "train/negative_loss": 2.141780138015747, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.41989991068840027, + "train/total_loss": 0.8195430040359497 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.2946408689022064, - "train/contrastive_loss": 2.5486350059509277, - "train/negative_loss": 1.7673654556274414, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.7812696099281311, - "train/total_loss": 0.8043678998947144 + "train/classification_loss": 0.3118622303009033, + "train/contrastive_loss": 4.651161193847656, + "train/negative_loss": 3.265319585800171, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.385841727256775, + "train/total_loss": 1.2420945167541504 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.296133816242218, - "train/contrastive_loss": 4.4894490242004395, - "train/negative_loss": 4.13041353225708, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.3590353727340698, - "train/total_loss": 1.194023609161377 + "train/classification_loss": 0.31704023480415344, + "train/contrastive_loss": 2.5177791118621826, + "train/negative_loss": 2.467808485031128, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.049970537424087524, + "train/total_loss": 0.8205960988998413 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.30204591155052185, - "train/contrastive_loss": 3.3057894706726074, - "train/negative_loss": 2.9320380687713623, + "train/classification_loss": 0.2948223352432251, + "train/contrastive_loss": 0.7317419648170471, + "train/negative_loss": 0.5935785174369812, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.3737514019012451, - "train/total_loss": 0.9632037878036499 + "train/num_positives": 16, + "train/positive_loss": 0.13816343247890472, + "train/total_loss": 0.44117075204849243 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.2780458927154541, - "train/contrastive_loss": 3.9225244522094727, - "train/negative_loss": 3.885406017303467, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.03711840882897377, - "train/total_loss": 1.0625507831573486 + "train/classification_loss": 0.3094301223754883, + "train/contrastive_loss": 2.8702237606048584, + "train/negative_loss": 2.7152650356292725, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 0.15495876967906952, + "train/total_loss": 0.8834748864173889 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.3283763825893402, - "train/contrastive_loss": 3.511981964111328, - "train/negative_loss": 3.296717882156372, + "train/classification_loss": 0.3186941146850586, + "train/contrastive_loss": 3.375020980834961, + "train/negative_loss": 3.3734092712402344, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.21526405215263367, - "train/total_loss": 1.0307728052139282 + "train/num_positives": 2, + "train/positive_loss": 0.0016116963233798742, + "train/total_loss": 0.9936982989311218 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.2980087399482727, - "train/contrastive_loss": 5.18324089050293, - "train/negative_loss": 5.179697036743164, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.003543616272509098, - "train/total_loss": 1.3346569538116455 + "train/classification_loss": 0.2759850323200226, + "train/contrastive_loss": 2.366849899291992, + "train/negative_loss": 2.1227517127990723, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.2440982311964035, + "train/total_loss": 0.7493550181388855 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.26877525448799133, - "train/contrastive_loss": 2.668714761734009, - "train/negative_loss": 2.0478734970092773, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.6208412051200867, - "train/total_loss": 0.8025182485580444 + "train/classification_loss": 0.30546504259109497, + "train/contrastive_loss": 3.506561279296875, + "train/negative_loss": 3.472888946533203, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.03367223963141441, + "train/total_loss": 1.006777286529541 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.2906784117221832, - "train/contrastive_loss": 2.675349473953247, - "train/negative_loss": 2.5713350772857666, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.10401449352502823, - "train/total_loss": 0.8257483243942261 + "train/classification_loss": 0.33961692452430725, + "train/contrastive_loss": 3.1121997833251953, + "train/negative_loss": 2.3136544227600098, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 0.798545241355896, + "train/total_loss": 0.9620568752288818 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.3124653100967407, - "train/contrastive_loss": 4.070686340332031, - "train/negative_loss": 3.1573219299316406, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.9133642911911011, - "train/total_loss": 1.1266026496887207 + "train/classification_loss": 0.2976114749908447, + "train/contrastive_loss": 4.00618839263916, + "train/negative_loss": 4.005701541900635, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.0004868100513704121, + "train/total_loss": 1.0988491773605347 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.30095839500427246, - "train/contrastive_loss": 2.7330963611602783, - "train/negative_loss": 2.5693202018737793, + "train/classification_loss": 0.3231847584247589, + "train/contrastive_loss": 1.5908297300338745, + "train/negative_loss": 1.5669194459915161, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.1637762039899826, - "train/total_loss": 0.847577691078186 + "train/positive_loss": 0.02391027845442295, + "train/total_loss": 0.6413507461547852 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.3062559962272644, - "train/contrastive_loss": 1.3834869861602783, - "train/negative_loss": 1.381471872329712, + "train/classification_loss": 0.31038302183151245, + "train/contrastive_loss": 2.4374196529388428, + "train/negative_loss": 2.419769048690796, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.002015161095187068, - "train/total_loss": 0.5829533934593201 + "train/num_positives": 8, + "train/positive_loss": 0.017650671303272247, + "train/total_loss": 0.797866940498352 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.27228766679763794, - "train/contrastive_loss": 3.6553242206573486, - "train/negative_loss": 3.6182351112365723, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.03708910942077637, - "train/total_loss": 1.0033525228500366 + "train/classification_loss": 0.2667391896247864, + "train/contrastive_loss": 2.343015193939209, + "train/negative_loss": 2.3206093311309814, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.022405769675970078, + "train/total_loss": 0.735342264175415 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.3059760332107544, - "train/contrastive_loss": 2.6152610778808594, - "train/negative_loss": 2.567004680633545, - "train/num_negatives": 46, + "train/classification_loss": 0.32684218883514404, + "train/contrastive_loss": 1.964792013168335, + "train/negative_loss": 1.7444849014282227, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.04825642332434654, - "train/total_loss": 0.8290282487869263 + "train/positive_loss": 0.22030705213546753, + "train/total_loss": 0.719800591468811 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.3446093797683716, - "train/contrastive_loss": 2.5056025981903076, - "train/negative_loss": 2.5056025981903076, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.8457298874855042 + "train/classification_loss": 0.3296954929828644, + "train/contrastive_loss": 3.6302342414855957, + "train/negative_loss": 2.858065128326416, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.7721689939498901, + "train/total_loss": 1.0557423830032349 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "eval_exact_match_accuracy": 0.0, - "eval_hamming_loss": 0.09837535014005602, - "eval_loss": 0.8820907473564148, - "eval_macro_f1": 0.0005656108597285068, + "eval_hamming_loss": 0.09720925407199917, + "eval_loss": 0.8579484224319458, + "eval_macro_f1": 0.0006033182503770739, "eval_macro_precision": 0.058823529411764705, - "eval_macro_recall": 0.0002841716396703609, - "eval_micro_f1": 0.0022727272727272726, + "eval_macro_recall": 0.00030321406913280777, + "eval_micro_f1": 0.002129925452609159, "eval_micro_precision": 1.0, - "eval_micro_recall": 0.0011376564277588168, - "eval_runtime": 2.6343, - "eval_samples_per_second": 199.295, - "eval_steps_per_second": 25.054, + "eval_micro_recall": 0.0010660980810234541, + "eval_runtime": 2.8413, + "eval_samples_per_second": 199.558, + "eval_steps_per_second": 24.989, "step": 300 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.27910444140434265, - "train/contrastive_loss": 1.411466121673584, - "train/negative_loss": 1.242889165878296, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.1685769259929657, - "train/total_loss": 0.5613976716995239 + "train/classification_loss": 0.2964499294757843, + "train/contrastive_loss": 2.260348320007324, + "train/negative_loss": 1.5223454236984253, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.7380029559135437, + "train/total_loss": 0.7485195994377136 }, { - "epoch": 1.1406844106463878, + "epoch": 1.056338028169014, "step": 300, - "train/classification_loss": 0.34426289796829224, - "train/contrastive_loss": 2.715529441833496, - "train/negative_loss": 1.3187447786331177, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.396784782409668, - "train/total_loss": 0.8873687982559204 + "train/classification_loss": 0.3303905427455902, + "train/contrastive_loss": 2.6616411209106445, + "train/negative_loss": 1.471295952796936, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 1.190345048904419, + "train/total_loss": 0.8627188205718994 }, { - "epoch": 1.3307984790874525, - "grad_norm": 18.043262481689453, - "learning_rate": 1.996240487062405e-05, - "loss": 1.2439, + "epoch": 1.232394366197183, + "grad_norm": 22.85978889465332, + "learning_rate": 1.9965186751233265e-05, + "loss": 1.2471, "step": 350 }, { - "epoch": 1.3307984790874525, + "epoch": 1.232394366197183, "step": 350, - "train/classification_loss": 0.26427382230758667, - "train/contrastive_loss": 1.134790062904358, - "train/negative_loss": 0.9394581913948059, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.19533191621303558, - "train/total_loss": 0.49123185873031616 + "train/classification_loss": 0.2880552113056183, + "train/contrastive_loss": 1.1895866394042969, + "train/negative_loss": 1.1130249500274658, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.07656171917915344, + "train/total_loss": 0.5259725451469421 }, { - "epoch": 1.3307984790874525, + "epoch": 1.232394366197183, "step": 350, - "train/classification_loss": 0.2695280909538269, - "train/contrastive_loss": 1.262587308883667, - "train/negative_loss": 1.015742301940918, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.24684500694274902, - "train/total_loss": 0.5220455527305603 + "train/classification_loss": 0.26903045177459717, + "train/contrastive_loss": 1.6373264789581299, + "train/negative_loss": 0.9257901310920715, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.7115364074707031, + "train/total_loss": 0.5964957475662231 }, { - "epoch": 1.5209125475285172, - "grad_norm": 17.234338760375977, - "learning_rate": 1.9954794520547948e-05, - "loss": 1.1991, + "epoch": 1.408450704225352, + "grad_norm": 21.00748062133789, + "learning_rate": 1.9958139534883723e-05, + "loss": 1.2271, "step": 400 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.3130839169025421, - "train/contrastive_loss": 1.7824201583862305, - "train/negative_loss": 1.3832169771194458, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.39920324087142944, - "train/total_loss": 0.6695679426193237 + "train/classification_loss": 0.28314051032066345, + "train/contrastive_loss": 3.6485836505889893, + "train/negative_loss": 3.6469433307647705, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.0016404222697019577, + "train/total_loss": 1.01285719871521 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2885851263999939, - "train/contrastive_loss": 2.799382448196411, - "train/negative_loss": 2.089852809906006, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.7095296382904053, - "train/total_loss": 0.8484616279602051 + "train/classification_loss": 0.35745859146118164, + "train/contrastive_loss": 1.6834310293197632, + "train/negative_loss": 1.6269944906234741, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.05643654987215996, + "train/total_loss": 0.6941448450088501 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2638190686702728, - "train/contrastive_loss": 3.016111373901367, - "train/negative_loss": 1.4684597253799438, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.5476516485214233, - "train/total_loss": 0.8670413494110107 + "train/classification_loss": 0.3006758391857147, + "train/contrastive_loss": 4.145646572113037, + "train/negative_loss": 2.6357791423797607, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.509867548942566, + "train/total_loss": 1.1298052072525024 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2644801735877991, - "train/contrastive_loss": 3.1516568660736084, - "train/negative_loss": 2.6517927646636963, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.49986404180526733, - "train/total_loss": 0.8948115706443787 + "train/classification_loss": 0.22981052100658417, + "train/contrastive_loss": 2.5373754501342773, + "train/negative_loss": 2.4768316745758057, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.060543760657310486, + "train/total_loss": 0.7372856140136719 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.30244559049606323, - "train/contrastive_loss": 2.1174185276031494, - "train/negative_loss": 1.9102649688720703, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.20715346932411194, - "train/total_loss": 0.7259292602539062 + "train/classification_loss": 0.2808890640735626, + "train/contrastive_loss": 3.290686845779419, + "train/negative_loss": 3.189662218093872, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.1010245680809021, + "train/total_loss": 0.9390264749526978 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.28559616208076477, - "train/contrastive_loss": 2.0670104026794434, - "train/negative_loss": 1.938764214515686, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.12824606895446777, - "train/total_loss": 0.698998212814331 + "train/classification_loss": 0.2821494936943054, + "train/contrastive_loss": 3.2997570037841797, + "train/negative_loss": 2.7153472900390625, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.5844097137451172, + "train/total_loss": 0.9421008825302124 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.3234643340110779, - "train/contrastive_loss": 1.8243683576583862, - "train/negative_loss": 1.778984785079956, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.045383598655462265, - "train/total_loss": 0.688338041305542 + "train/classification_loss": 0.2745994031429291, + "train/contrastive_loss": 2.316945791244507, + "train/negative_loss": 2.0420944690704346, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.27485138177871704, + "train/total_loss": 0.7379885911941528 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.23712889850139618, - "train/contrastive_loss": 1.7636357545852661, - "train/negative_loss": 1.2017720937728882, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.5618636608123779, - "train/total_loss": 0.5898560285568237 + "train/classification_loss": 0.31354820728302, + "train/contrastive_loss": 2.1877691745758057, + "train/negative_loss": 2.187727212905884, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 4.1962550312746316e-05, + "train/total_loss": 0.751102089881897 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2554152309894562, - "train/contrastive_loss": 1.437118649482727, - "train/negative_loss": 1.4297376871109009, + "train/classification_loss": 0.27818140387535095, + "train/contrastive_loss": 2.015977382659912, + "train/negative_loss": 1.615659236907959, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.007380938157439232, - "train/total_loss": 0.5428389310836792 + "train/positive_loss": 0.4003180265426636, + "train/total_loss": 0.6813768744468689 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.3288363814353943, - "train/contrastive_loss": 3.561093807220459, - "train/negative_loss": 2.317636013031006, + "train/classification_loss": 0.29782742261886597, + "train/contrastive_loss": 3.6882712841033936, + "train/negative_loss": 2.3672292232513428, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.2434579133987427, - "train/total_loss": 1.0410552024841309 + "train/num_positives": 14, + "train/positive_loss": 1.3210420608520508, + "train/total_loss": 1.0354816913604736 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.27076956629753113, - "train/contrastive_loss": 2.1460652351379395, - "train/negative_loss": 2.080864667892456, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.06520066410303116, - "train/total_loss": 0.6999826431274414 + "train/classification_loss": 0.2708834409713745, + "train/contrastive_loss": 1.884966254234314, + "train/negative_loss": 1.7773405313491821, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.10762572288513184, + "train/total_loss": 0.6478767395019531 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2500836253166199, - "train/contrastive_loss": 1.3183083534240723, - "train/negative_loss": 1.2435946464538574, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.07471369951963425, - "train/total_loss": 0.5137453079223633 + "train/classification_loss": 0.2913475036621094, + "train/contrastive_loss": 2.8310608863830566, + "train/negative_loss": 2.1860485076904297, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.6450124382972717, + "train/total_loss": 0.8575596809387207 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.28650963306427, - "train/contrastive_loss": 3.820486307144165, - "train/negative_loss": 3.1066625118255615, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.7138238549232483, - "train/total_loss": 1.0506069660186768 + "train/classification_loss": 0.2809962034225464, + "train/contrastive_loss": 4.520957946777344, + "train/negative_loss": 3.2867579460144043, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.2342002391815186, + "train/total_loss": 1.185187816619873 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.26550403237342834, - "train/contrastive_loss": 2.156113386154175, - "train/negative_loss": 2.154571294784546, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.0015421150019392371, - "train/total_loss": 0.6967266798019409 + "train/classification_loss": 0.3250114917755127, + "train/contrastive_loss": 6.256960868835449, + "train/negative_loss": 2.8978018760681152, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 3.359158992767334, + "train/total_loss": 1.5764037370681763 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.24077241122722626, - "train/contrastive_loss": 2.027468681335449, - "train/negative_loss": 1.9469760656356812, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.0804925337433815, - "train/total_loss": 0.6462661623954773 + "train/classification_loss": 0.21937939524650574, + "train/contrastive_loss": 2.758821725845337, + "train/negative_loss": 2.2684803009033203, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.4903413653373718, + "train/total_loss": 0.7711437940597534 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2602681815624237, - "train/contrastive_loss": 1.577919602394104, - "train/negative_loss": 1.5463966131210327, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.031522974371910095, - "train/total_loss": 0.57585209608078 + "train/classification_loss": 0.2930915057659149, + "train/contrastive_loss": 3.8704781532287598, + "train/negative_loss": 3.289940357208252, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.5805377960205078, + "train/total_loss": 1.0671871900558472 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.3029567003250122, - "train/contrastive_loss": 2.4382457733154297, - "train/negative_loss": 2.0572423934936523, - "train/num_negatives": 40, + "train/classification_loss": 0.2719612121582031, + "train/contrastive_loss": 2.343186855316162, + "train/negative_loss": 2.2578723430633545, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.38100340962409973, - "train/total_loss": 0.790605902671814 + "train/positive_loss": 0.0853145644068718, + "train/total_loss": 0.7405985593795776 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.327029287815094, - "train/contrastive_loss": 2.130749225616455, - "train/negative_loss": 1.3067207336425781, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.824028491973877, - "train/total_loss": 0.753179132938385 + "train/classification_loss": 0.2838720381259918, + "train/contrastive_loss": 4.29950475692749, + "train/negative_loss": 2.86482572555542, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 1.4346790313720703, + "train/total_loss": 1.1437729597091675 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.3177184462547302, - "train/contrastive_loss": 1.9496716260910034, - "train/negative_loss": 1.94253408908844, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.007137560751289129, - "train/total_loss": 0.7076528072357178 + "train/classification_loss": 0.3134099245071411, + "train/contrastive_loss": 1.483730673789978, + "train/negative_loss": 1.449765682220459, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.03396494314074516, + "train/total_loss": 0.6101560592651367 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.26200923323631287, - "train/contrastive_loss": 2.975144863128662, - "train/negative_loss": 2.5689032077789307, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.4062417149543762, - "train/total_loss": 0.8570382595062256 + "train/classification_loss": 0.2442343682050705, + "train/contrastive_loss": 2.234797954559326, + "train/negative_loss": 2.1959829330444336, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.03881501033902168, + "train/total_loss": 0.6911939382553101 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.3143180310726166, - "train/contrastive_loss": 2.9048967361450195, - "train/negative_loss": 1.8205244541168213, - "train/num_negatives": 44, + "train/classification_loss": 0.25493910908699036, + "train/contrastive_loss": 1.4183422327041626, + "train/negative_loss": 1.3800286054611206, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.0843722820281982, - "train/total_loss": 0.8952974081039429 + "train/positive_loss": 0.03831358626484871, + "train/total_loss": 0.5386075973510742 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.3347070813179016, - "train/contrastive_loss": 2.288820505142212, - "train/negative_loss": 2.2854511737823486, - "train/num_negatives": 44, + "train/classification_loss": 0.2346188873052597, + "train/contrastive_loss": 2.815380811691284, + "train/negative_loss": 2.572707176208496, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.0033694207668304443, - "train/total_loss": 0.792471170425415 + "train/positive_loss": 0.24267353117465973, + "train/total_loss": 0.7976951003074646 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2514670193195343, - "train/contrastive_loss": 1.2011758089065552, - "train/negative_loss": 1.0148028135299683, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.1863730400800705, - "train/total_loss": 0.49170219898223877 + "train/classification_loss": 0.2991984188556671, + "train/contrastive_loss": 4.171680450439453, + "train/negative_loss": 1.799856185913086, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 2.371824264526367, + "train/total_loss": 1.133534550666809 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.24096502363681793, - "train/contrastive_loss": 1.5410733222961426, - "train/negative_loss": 1.1118245124816895, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.4292488098144531, - "train/total_loss": 0.5491796731948853 + "train/classification_loss": 0.3120678663253784, + "train/contrastive_loss": 2.901266098022461, + "train/negative_loss": 2.0078399181365967, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.8934262990951538, + "train/total_loss": 0.8923211097717285 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.21912460029125214, - "train/contrastive_loss": 2.416769027709961, - "train/negative_loss": 2.4099948406219482, + "train/classification_loss": 0.29216432571411133, + "train/contrastive_loss": 2.6716737747192383, + "train/negative_loss": 1.666440486907959, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.006774227600544691, - "train/total_loss": 0.7024784088134766 + "train/num_positives": 10, + "train/positive_loss": 1.0052334070205688, + "train/total_loss": 0.8264991044998169 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.3117242157459259, - "train/contrastive_loss": 1.9101349115371704, - "train/negative_loss": 0.5341365337371826, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.3759983777999878, - "train/total_loss": 0.6937512159347534 + "train/classification_loss": 0.27575424313545227, + "train/contrastive_loss": 3.7175068855285645, + "train/negative_loss": 2.7596592903137207, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.9578475952148438, + "train/total_loss": 1.0192556381225586 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2965089678764343, - "train/contrastive_loss": 1.8907849788665771, - "train/negative_loss": 1.8753217458724976, + "train/classification_loss": 0.2976415455341339, + "train/contrastive_loss": 2.7999374866485596, + "train/negative_loss": 2.7792277336120605, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.015463270246982574, - "train/total_loss": 0.6746659278869629 + "train/num_positives": 4, + "train/positive_loss": 0.020709799602627754, + "train/total_loss": 0.8576290607452393 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2969740033149719, - "train/contrastive_loss": 2.611759901046753, - "train/negative_loss": 2.179718255996704, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.43204164505004883, - "train/total_loss": 0.8193259835243225 + "train/classification_loss": 0.29993757605552673, + "train/contrastive_loss": 0.8771870732307434, + "train/negative_loss": 0.8421351909637451, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.0350518561899662, + "train/total_loss": 0.4753749966621399 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.29800960421562195, - "train/contrastive_loss": 1.4127709865570068, - "train/negative_loss": 1.3993638753890991, - "train/num_negatives": 40, + "train/classification_loss": 0.280966192483902, + "train/contrastive_loss": 3.608607769012451, + "train/negative_loss": 2.94978404045105, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.013407165184617043, - "train/total_loss": 0.5805637836456299 + "train/positive_loss": 0.6588236689567566, + "train/total_loss": 1.0026878118515015 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.31452056765556335, - "train/contrastive_loss": 3.9774842262268066, - "train/negative_loss": 2.7785239219665527, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 1.198960304260254, - "train/total_loss": 1.1100174188613892 + "train/classification_loss": 0.32713279128074646, + "train/contrastive_loss": 1.831444501876831, + "train/negative_loss": 1.7606438398361206, + "train/num_negatives": 38, + "train/num_positives": 10, + "train/positive_loss": 0.07080063968896866, + "train/total_loss": 0.6934217214584351 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2927503287792206, - "train/contrastive_loss": 2.5104503631591797, - "train/negative_loss": 1.3983690738677979, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 1.1120812892913818, - "train/total_loss": 0.7948404550552368 + "train/classification_loss": 0.24486862123012543, + "train/contrastive_loss": 1.659805178642273, + "train/negative_loss": 1.6573882102966309, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.0024170209653675556, + "train/total_loss": 0.5768296718597412 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.28147438168525696, - "train/contrastive_loss": 2.2251832485198975, - "train/negative_loss": 1.7999745607376099, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.42520877718925476, - "train/total_loss": 0.7265110015869141 + "train/classification_loss": 0.2733094394207001, + "train/contrastive_loss": 4.90904426574707, + "train/negative_loss": 3.468482494354248, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.4405617713928223, + "train/total_loss": 1.2551182508468628 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.3430488705635071, - "train/contrastive_loss": 1.9732694625854492, - "train/negative_loss": 1.9727033376693726, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0005661062896251678, - "train/total_loss": 0.7377027273178101 + "train/classification_loss": 0.28643983602523804, + "train/contrastive_loss": 3.4082577228546143, + "train/negative_loss": 2.7432756423950195, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.66498202085495, + "train/total_loss": 0.9680913686752319 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.3026675879955292, - "train/contrastive_loss": 2.1712801456451416, - "train/negative_loss": 1.6062854528427124, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.5649946928024292, - "train/total_loss": 0.7369236350059509 + "train/classification_loss": 0.29841044545173645, + "train/contrastive_loss": 2.4200477600097656, + "train/negative_loss": 2.043607473373413, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.37644028663635254, + "train/total_loss": 0.7824200391769409 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.28055405616760254, - "train/contrastive_loss": 3.234975814819336, - "train/negative_loss": 2.721615791320801, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.5133600234985352, - "train/total_loss": 0.9275492429733276 + "train/classification_loss": 0.3234871029853821, + "train/contrastive_loss": 4.502335548400879, + "train/negative_loss": 3.422264575958252, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 1.080070972442627, + "train/total_loss": 1.223954200744629 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.25944212079048157, - "train/contrastive_loss": 4.497574806213379, - "train/negative_loss": 2.591249942779541, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.906324863433838, - "train/total_loss": 1.1589571237564087 + "train/classification_loss": 0.23264829814434052, + "train/contrastive_loss": 3.969658136367798, + "train/negative_loss": 3.4609906673431396, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.5086674690246582, + "train/total_loss": 1.0265799760818481 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.27296850085258484, - "train/contrastive_loss": 3.3886611461639404, - "train/negative_loss": 3.262725830078125, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.12593528628349304, - "train/total_loss": 0.9507007598876953 + "train/classification_loss": 0.2903940677642822, + "train/contrastive_loss": 2.3835885524749756, + "train/negative_loss": 2.3447093963623047, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 0.03887925297021866, + "train/total_loss": 0.7671117782592773 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2657545804977417, - "train/contrastive_loss": 2.3722457885742188, - "train/negative_loss": 1.7828987836837769, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.5893470644950867, - "train/total_loss": 0.7402037382125854 + "train/classification_loss": 0.35945478081703186, + "train/contrastive_loss": 5.76614236831665, + "train/negative_loss": 5.759280204772949, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.006862022913992405, + "train/total_loss": 1.5126832723617554 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2989766001701355, - "train/contrastive_loss": 1.5411498546600342, - "train/negative_loss": 1.4941036701202393, - "train/num_negatives": 46, + "train/classification_loss": 0.2925422787666321, + "train/contrastive_loss": 1.3959766626358032, + "train/negative_loss": 1.1795071363449097, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.21646957099437714, + "train/total_loss": 0.5717376470565796 + }, + { + "epoch": 1.408450704225352, + "step": 400, + "train/classification_loss": 0.30739670991897583, + "train/contrastive_loss": 4.221601486206055, + "train/negative_loss": 4.039336681365967, + "train/num_negatives": 42, "train/num_positives": 8, - "train/positive_loss": 0.04704619199037552, - "train/total_loss": 0.6072065830230713 + "train/positive_loss": 0.18226470053195953, + "train/total_loss": 1.151716947555542 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2826122045516968, - "train/contrastive_loss": 2.916254758834839, - "train/negative_loss": 2.9154655933380127, + "train/classification_loss": 0.24188092350959778, + "train/contrastive_loss": 2.5173935890197754, + "train/negative_loss": 2.0494346618652344, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.0007892384310252964, - "train/total_loss": 0.8658631443977356 + "train/num_positives": 10, + "train/positive_loss": 0.467958927154541, + "train/total_loss": 0.7453596591949463 + }, + { + "epoch": 1.408450704225352, + "step": 400, + "train/classification_loss": 0.25453948974609375, + "train/contrastive_loss": 5.941244125366211, + "train/negative_loss": 4.527768611907959, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 1.4134756326675415, + "train/total_loss": 1.4427883625030518 + }, + { + "epoch": 1.408450704225352, + "step": 400, + "train/classification_loss": 0.31516823172569275, + "train/contrastive_loss": 2.153377056121826, + "train/negative_loss": 2.133862018585205, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.01951492205262184, + "train/total_loss": 0.7458436489105225 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2651289701461792, - "train/contrastive_loss": 1.491920828819275, - "train/negative_loss": 1.4197415113449097, + "train/classification_loss": 0.2895812392234802, + "train/contrastive_loss": 3.385507345199585, + "train/negative_loss": 3.381545305252075, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.07217933237552643, - "train/total_loss": 0.5635131597518921 + "train/positive_loss": 0.003962024115025997, + "train/total_loss": 0.9666827321052551 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2676490843296051, - "train/contrastive_loss": 2.4212470054626465, - "train/negative_loss": 2.378061532974243, - "train/num_negatives": 36, + "train/classification_loss": 0.29960328340530396, + "train/contrastive_loss": 2.3431429862976074, + "train/negative_loss": 1.7375675439834595, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.6055755615234375, + "train/total_loss": 0.7682318687438965 + }, + { + "epoch": 1.408450704225352, + "step": 400, + "train/classification_loss": 0.34186220169067383, + "train/contrastive_loss": 4.986680507659912, + "train/negative_loss": 4.8491291999816895, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.04318556562066078, - "train/total_loss": 0.7518985271453857 + "train/positive_loss": 0.13755129277706146, + "train/total_loss": 1.339198350906372 + }, + { + "epoch": 1.408450704225352, + "step": 400, + "train/classification_loss": 0.2666102647781372, + "train/contrastive_loss": 4.593352317810059, + "train/negative_loss": 2.2988717555999756, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 2.294480800628662, + "train/total_loss": 1.1852807998657227 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.30975139141082764, - "train/contrastive_loss": 2.5920569896698, - "train/negative_loss": 2.2571537494659424, + "train/classification_loss": 0.28822842240333557, + "train/contrastive_loss": 2.5433995723724365, + "train/negative_loss": 2.4596502780914307, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.3349032402038574, - "train/total_loss": 0.8281627893447876 + "train/num_positives": 14, + "train/positive_loss": 0.08374931663274765, + "train/total_loss": 0.7969083786010742 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2641478180885315, - "train/contrastive_loss": 3.0395798683166504, - "train/negative_loss": 2.4060957431793213, + "train/classification_loss": 0.3163786232471466, + "train/contrastive_loss": 2.4625463485717773, + "train/negative_loss": 2.4441275596618652, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.6334841847419739, - "train/total_loss": 0.8720638155937195 + "train/num_positives": 2, + "train/positive_loss": 0.018418695777654648, + "train/total_loss": 0.8088878989219666 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2527199983596802, - "train/contrastive_loss": 1.4782119989395142, - "train/negative_loss": 0.9848592877388, + "train/classification_loss": 0.2659255862236023, + "train/contrastive_loss": 2.0809900760650635, + "train/negative_loss": 1.687066674232483, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.4933527410030365, - "train/total_loss": 0.5483623743057251 + "train/num_positives": 16, + "train/positive_loss": 0.3939233124256134, + "train/total_loss": 0.682123601436615 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.3391089141368866, - "train/contrastive_loss": 1.790329098701477, - "train/negative_loss": 1.743017554283142, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.04731154441833496, - "train/total_loss": 0.6971747279167175 + "train/classification_loss": 0.3270394504070282, + "train/contrastive_loss": 2.4765117168426514, + "train/negative_loss": 2.187736988067627, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.28877466917037964, + "train/total_loss": 0.822341799736023 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2502748370170593, - "train/contrastive_loss": 1.6319578886032104, - "train/negative_loss": 1.631218671798706, - "train/num_negatives": 48, + "train/classification_loss": 0.3214586079120636, + "train/contrastive_loss": 2.243574619293213, + "train/negative_loss": 2.226280927658081, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 0.0007392129627987742, - "train/total_loss": 0.5766664147377014 + "train/positive_loss": 0.017293790355324745, + "train/total_loss": 0.7701735496520996 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.28242114186286926, - "train/contrastive_loss": 0.6333229541778564, - "train/negative_loss": 0.35982316732406616, + "train/classification_loss": 0.2980997860431671, + "train/contrastive_loss": 1.4891579151153564, + "train/negative_loss": 1.262666940689087, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.27349981665611267, - "train/total_loss": 0.409085750579834 + "train/num_positives": 14, + "train/positive_loss": 0.22649097442626953, + "train/total_loss": 0.5959314107894897 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.26124870777130127, - "train/contrastive_loss": 2.5064175128936768, - "train/negative_loss": 2.492769479751587, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.013648087158799171, - "train/total_loss": 0.7625322341918945 + "train/classification_loss": 0.3622506260871887, + "train/contrastive_loss": 3.5721888542175293, + "train/negative_loss": 3.4855449199676514, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 0.08664385974407196, + "train/total_loss": 1.0766884088516235 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.32650408148765564, - "train/contrastive_loss": 0.877875804901123, - "train/negative_loss": 0.8247732520103455, - "train/num_negatives": 28, + "train/classification_loss": 0.2531818449497223, + "train/contrastive_loss": 2.639148235321045, + "train/negative_loss": 2.637859344482422, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.053102537989616394, - "train/total_loss": 0.5020792484283447 + "train/positive_loss": 0.0012888265773653984, + "train/total_loss": 0.7810114622116089 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.29279547929763794, - "train/contrastive_loss": 3.2104902267456055, - "train/negative_loss": 2.1327273845672607, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.0777629613876343, - "train/total_loss": 0.9348935484886169 + "train/classification_loss": 0.2568850815296173, + "train/contrastive_loss": 2.1130855083465576, + "train/negative_loss": 1.893040657043457, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.22004477679729462, + "train/total_loss": 0.6795021891593933 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2651278078556061, - "train/contrastive_loss": 2.378021478652954, - "train/negative_loss": 2.3742973804473877, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.0037241321988403797, - "train/total_loss": 0.7407320737838745 + "train/classification_loss": 0.28819215297698975, + "train/contrastive_loss": 3.1632916927337646, + "train/negative_loss": 3.134622812271118, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.02866896614432335, + "train/total_loss": 0.9208505153656006 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.27547386288642883, - "train/contrastive_loss": 2.2212162017822266, - "train/negative_loss": 1.3908841609954834, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.8303321599960327, - "train/total_loss": 0.7197171449661255 + "train/classification_loss": 0.292076051235199, + "train/contrastive_loss": 5.979118347167969, + "train/negative_loss": 3.3803794384002686, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 2.5987389087677, + "train/total_loss": 1.4878997802734375 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.28208738565444946, - "train/contrastive_loss": 3.892136573791504, - "train/negative_loss": 3.3745920658111572, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.5175445079803467, - "train/total_loss": 1.0605146884918213 + "train/classification_loss": 0.2968142628669739, + "train/contrastive_loss": 2.799877166748047, + "train/negative_loss": 2.6201677322387695, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.17970947921276093, + "train/total_loss": 0.8567897081375122 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2848222553730011, - "train/contrastive_loss": 2.658534526824951, - "train/negative_loss": 1.9752930402755737, + "train/classification_loss": 0.2720637023448944, + "train/contrastive_loss": 1.3613431453704834, + "train/negative_loss": 1.1893391609191895, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.6832413673400879, - "train/total_loss": 0.8165291547775269 + "train/num_positives": 16, + "train/positive_loss": 0.17200396955013275, + "train/total_loss": 0.5443323254585266 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2572706341743469, - "train/contrastive_loss": 3.960623264312744, - "train/negative_loss": 3.6354446411132812, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.3251786231994629, - "train/total_loss": 1.0493953227996826 + "train/classification_loss": 0.2867943346500397, + "train/contrastive_loss": 2.043962001800537, + "train/negative_loss": 1.7115544080734253, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 0.332407683134079, + "train/total_loss": 0.6955867409706116 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.3152223825454712, - "train/contrastive_loss": 3.580897808074951, - "train/negative_loss": 2.307541847229004, + "train/classification_loss": 0.306005597114563, + "train/contrastive_loss": 3.86198091506958, + "train/negative_loss": 3.858013391494751, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.2733559608459473, - "train/total_loss": 1.0314018726348877 + "train/num_positives": 2, + "train/positive_loss": 0.003967516124248505, + "train/total_loss": 1.078401803970337 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.27916914224624634, - "train/contrastive_loss": 3.4964535236358643, - "train/negative_loss": 3.466059446334839, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.030393965542316437, - "train/total_loss": 0.9784598350524902 + "train/classification_loss": 0.2502118945121765, + "train/contrastive_loss": 2.805070400238037, + "train/negative_loss": 2.1969077587127686, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.6081627607345581, + "train/total_loss": 0.8112260103225708 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2471722960472107, - "train/contrastive_loss": 1.85983145236969, - "train/negative_loss": 1.5313163995742798, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.32851505279541016, - "train/total_loss": 0.6191385984420776 + "train/classification_loss": 0.2816160321235657, + "train/contrastive_loss": 3.772751569747925, + "train/negative_loss": 3.761920213699341, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.010831433348357677, + "train/total_loss": 1.0361664295196533 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.27177321910858154, - "train/contrastive_loss": 1.909385085105896, - "train/negative_loss": 1.6199818849563599, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.28940317034721375, - "train/total_loss": 0.6536502838134766 + "train/classification_loss": 0.3179038166999817, + "train/contrastive_loss": 5.492734909057617, + "train/negative_loss": 3.0714924335479736, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 2.4212422370910645, + "train/total_loss": 1.4164507389068604 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2921210825443268, - "train/contrastive_loss": 4.060750484466553, - "train/negative_loss": 3.572638511657715, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.4881119132041931, - "train/total_loss": 1.1042711734771729 + "train/classification_loss": 0.2772493064403534, + "train/contrastive_loss": 2.904123306274414, + "train/negative_loss": 2.869365930557251, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.034757260233163834, + "train/total_loss": 0.8580739498138428 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2858498990535736, - "train/contrastive_loss": 3.071608304977417, - "train/negative_loss": 2.629793643951416, + "train/classification_loss": 0.30459970235824585, + "train/contrastive_loss": 1.9777851104736328, + "train/negative_loss": 1.9691665172576904, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.4418146312236786, - "train/total_loss": 0.9001715183258057 + "train/positive_loss": 0.008618637919425964, + "train/total_loss": 0.7001566886901855 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2894030809402466, - "train/contrastive_loss": 1.3904260396957397, - "train/negative_loss": 1.3895682096481323, + "train/classification_loss": 0.2939474880695343, + "train/contrastive_loss": 3.134911298751831, + "train/negative_loss": 3.0512232780456543, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.0008577844128012657, - "train/total_loss": 0.5674883127212524 + "train/num_positives": 8, + "train/positive_loss": 0.0836879089474678, + "train/total_loss": 0.9209297895431519 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2492283135652542, - "train/contrastive_loss": 2.765015125274658, - "train/negative_loss": 2.665844678878784, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.0991704910993576, - "train/total_loss": 0.8022313117980957 + "train/classification_loss": 0.2405194342136383, + "train/contrastive_loss": 2.8466434478759766, + "train/negative_loss": 2.642735719680786, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.203907772898674, + "train/total_loss": 0.8098481893539429 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2892957329750061, - "train/contrastive_loss": 1.8207976818084717, - "train/negative_loss": 1.8046183586120605, - "train/num_negatives": 46, + "train/classification_loss": 0.31088942289352417, + "train/contrastive_loss": 3.955350875854492, + "train/negative_loss": 2.314692735671997, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.016179274767637253, - "train/total_loss": 0.6534552574157715 + "train/positive_loss": 1.6406581401824951, + "train/total_loss": 1.1019595861434937 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.3328791856765747, - "train/contrastive_loss": 2.1411972045898438, - "train/negative_loss": 2.1411972045898438, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.7611186504364014 - }, - { - "epoch": 1.5209125475285172, - "eval_exact_match_accuracy": 0.02857142857142857, - "eval_hamming_loss": 0.09366946778711485, - "eval_loss": 0.7624192237854004, - "eval_macro_f1": 0.020235294117647056, + "train/classification_loss": 0.3126649260520935, + "train/contrastive_loss": 3.1432363986968994, + "train/negative_loss": 2.495011329650879, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.6482250690460205, + "train/total_loss": 0.9413121938705444 + }, + { + "epoch": 1.408450704225352, + "eval_exact_match_accuracy": 0.007054673721340388, + "eval_hamming_loss": 0.09627554725593941, + "eval_loss": 0.9071576595306396, + "eval_macro_f1": 0.0057670126874279125, "eval_macro_precision": 0.058823529411764705, - "eval_macro_recall": 0.012219380505825519, - "eval_micro_f1": 0.09327548806941431, + "eval_macro_recall": 0.0030321406913280773, + "eval_micro_f1": 0.02109704641350211, "eval_micro_precision": 1.0, - "eval_micro_recall": 0.048919226393629126, - "eval_runtime": 2.6322, - "eval_samples_per_second": 199.449, - "eval_steps_per_second": 25.074, + "eval_micro_recall": 0.010660980810234541, + "eval_runtime": 2.8429, + "eval_samples_per_second": 199.446, + "eval_steps_per_second": 24.975, "step": 400 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.26936665177345276, - "train/contrastive_loss": 2.2238264083862305, - "train/negative_loss": 1.1791372299194336, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 1.0446891784667969, - "train/total_loss": 0.7141319513320923 + "train/classification_loss": 0.3063514828681946, + "train/contrastive_loss": 0.9124388694763184, + "train/negative_loss": 0.6337320804595947, + "train/num_negatives": 46, + "train/num_positives": 10, + "train/positive_loss": 0.27870678901672363, + "train/total_loss": 0.4888392686843872 }, { - "epoch": 1.5209125475285172, + "epoch": 1.408450704225352, "step": 400, - "train/classification_loss": 0.2763923406600952, - "train/contrastive_loss": 1.6629462242126465, - "train/negative_loss": 1.0876610279083252, + "train/classification_loss": 0.28292348980903625, + "train/contrastive_loss": 1.2839583158493042, + "train/negative_loss": 1.1856136322021484, "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.5752851963043213, - "train/total_loss": 0.6089816093444824 + "train/positive_loss": 0.09834469854831696, + "train/total_loss": 0.5397151708602905 }, { - "epoch": 1.7110266159695817, - "grad_norm": 15.384295463562012, - "learning_rate": 1.9947184170471842e-05, - "loss": 1.1836, + "epoch": 1.584507042253521, + "grad_norm": 20.219684600830078, + "learning_rate": 1.995123326286117e-05, + "loss": 1.1671, "step": 450 }, { - "epoch": 1.7110266159695817, + "epoch": 1.584507042253521, "step": 450, - "train/classification_loss": 0.28599080443382263, - "train/contrastive_loss": 2.236501693725586, - "train/negative_loss": 1.4360575675964355, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.8004441261291504, - "train/total_loss": 0.7332911491394043 + "train/classification_loss": 0.2751622498035431, + "train/contrastive_loss": 1.8498551845550537, + "train/negative_loss": 0.8557652235031128, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.9940899014472961, + "train/total_loss": 0.6451332569122314 }, { - "epoch": 1.7110266159695817, + "epoch": 1.584507042253521, "step": 450, - "train/classification_loss": 0.2800164520740509, - "train/contrastive_loss": 1.2265368700027466, - "train/negative_loss": 1.1893432140350342, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.037193600088357925, - "train/total_loss": 0.5253238081932068 + "train/classification_loss": 0.2665400803089142, + "train/contrastive_loss": 2.26444673538208, + "train/negative_loss": 1.9925936460494995, + "train/num_negatives": 30, + "train/num_positives": 18, + "train/positive_loss": 0.2718530297279358, + "train/total_loss": 0.7194294333457947 }, { - "epoch": 1.9011406844106464, - "grad_norm": 24.527318954467773, - "learning_rate": 1.993957382039574e-05, - "loss": 1.1809, + "epoch": 1.76056338028169, + "grad_norm": 13.850686073303223, + "learning_rate": 1.994418604651163e-05, + "loss": 1.1877, "step": 500 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.3103904128074646, - "train/contrastive_loss": 2.0892696380615234, - "train/negative_loss": 1.3849194049835205, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.7043501138687134, - "train/total_loss": 0.7282443046569824 + "train/classification_loss": 0.2746850550174713, + "train/contrastive_loss": 2.372941732406616, + "train/negative_loss": 2.345904588699341, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.02703716978430748, + "train/total_loss": 0.749273419380188 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2790190875530243, - "train/contrastive_loss": 2.2548437118530273, - "train/negative_loss": 1.6857163906097412, - "train/num_negatives": 38, + "train/classification_loss": 0.3542173504829407, + "train/contrastive_loss": 1.5934892892837524, + "train/negative_loss": 1.4353690147399902, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.1581203192472458, + "train/total_loss": 0.6729152202606201 + }, + { + "epoch": 1.76056338028169, + "step": 500, + "train/classification_loss": 0.2922971546649933, + "train/contrastive_loss": 3.7633190155029297, + "train/negative_loss": 2.4660730361938477, + "train/num_negatives": 36, "train/num_positives": 14, - "train/positive_loss": 0.5691274404525757, - "train/total_loss": 0.7299878597259521 + "train/positive_loss": 1.2972458600997925, + "train/total_loss": 1.0449609756469727 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.24839375913143158, - "train/contrastive_loss": 2.939049243927002, - "train/negative_loss": 1.9531177282333374, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.985931396484375, - "train/total_loss": 0.8362036347389221 + "train/classification_loss": 0.21439695358276367, + "train/contrastive_loss": 2.3541316986083984, + "train/negative_loss": 1.6336003541946411, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.7205313444137573, + "train/total_loss": 0.6852233409881592 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2511407136917114, - "train/contrastive_loss": 3.147653818130493, - "train/negative_loss": 2.6599295139312744, + "train/classification_loss": 0.2711621820926666, + "train/contrastive_loss": 3.327296733856201, + "train/negative_loss": 3.0933024883270264, "train/num_negatives": 34, "train/num_positives": 18, - "train/positive_loss": 0.48772430419921875, - "train/total_loss": 0.880671501159668 + "train/positive_loss": 0.2339942753314972, + "train/total_loss": 0.9366215467453003 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.28555727005004883, - "train/contrastive_loss": 2.486170768737793, - "train/negative_loss": 2.4159867763519287, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.07018411159515381, - "train/total_loss": 0.7827914357185364 + "train/classification_loss": 0.2754226624965668, + "train/contrastive_loss": 3.468142509460449, + "train/negative_loss": 2.288297176361084, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 1.1798453330993652, + "train/total_loss": 0.9690511226654053 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.27446457743644714, - "train/contrastive_loss": 2.3979504108428955, - "train/negative_loss": 2.059108018875122, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.33884239196777344, - "train/total_loss": 0.7540546655654907 + "train/classification_loss": 0.2677496671676636, + "train/contrastive_loss": 2.6534390449523926, + "train/negative_loss": 1.895154356956482, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.7582846283912659, + "train/total_loss": 0.7984374761581421 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.3162132203578949, - "train/contrastive_loss": 2.1348564624786377, - "train/negative_loss": 1.657476544380188, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.4773799777030945, - "train/total_loss": 0.743184506893158 + "train/classification_loss": 0.3002317249774933, + "train/contrastive_loss": 1.6155636310577393, + "train/negative_loss": 1.6155221462249756, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 4.1485694964649156e-05, + "train/total_loss": 0.6233444213867188 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.22386887669563293, - "train/contrastive_loss": 1.6394387483596802, - "train/negative_loss": 1.3380980491638184, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.30134066939353943, - "train/total_loss": 0.5517566204071045 - }, - { - "epoch": 1.9011406844106464, - "step": 500, - "train/classification_loss": 0.23749828338623047, - "train/contrastive_loss": 1.8424558639526367, - "train/negative_loss": 1.830248475074768, + "train/classification_loss": 0.2563718259334564, + "train/contrastive_loss": 1.2085214853286743, + "train/negative_loss": 1.031713843345642, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.012207399122416973, - "train/total_loss": 0.6059894561767578 + "train/positive_loss": 0.17680767178535461, + "train/total_loss": 0.4980761408805847 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.3215911388397217, - "train/contrastive_loss": 3.364527702331543, - "train/negative_loss": 2.467162847518921, + "train/classification_loss": 0.2899928689002991, + "train/contrastive_loss": 3.2499887943267822, + "train/negative_loss": 1.6832780838012695, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.8973648548126221, - "train/total_loss": 0.9944967031478882 + "train/num_positives": 14, + "train/positive_loss": 1.5667107105255127, + "train/total_loss": 0.9399906396865845 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.25681617856025696, - "train/contrastive_loss": 2.610225200653076, - "train/negative_loss": 2.296335220336914, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.31388992071151733, - "train/total_loss": 0.7788612842559814 + "train/classification_loss": 0.2547776401042938, + "train/contrastive_loss": 1.6170804500579834, + "train/negative_loss": 1.590372085571289, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.026708392426371574, + "train/total_loss": 0.578193724155426 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.22908297181129456, - "train/contrastive_loss": 1.472802758216858, - "train/negative_loss": 1.3606058359146118, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.1121969074010849, - "train/total_loss": 0.5236434936523438 + "train/classification_loss": 0.27819275856018066, + "train/contrastive_loss": 2.675546169281006, + "train/negative_loss": 1.767678141593933, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.9078681468963623, + "train/total_loss": 0.8133019804954529 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2778133451938629, - "train/contrastive_loss": 3.652531147003174, - "train/negative_loss": 3.285484790802002, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.36704644560813904, - "train/total_loss": 1.008319616317749 + "train/classification_loss": 0.2753927409648895, + "train/contrastive_loss": 5.103810787200928, + "train/negative_loss": 2.7712783813476562, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 2.3325324058532715, + "train/total_loss": 1.2961549758911133 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.24634405970573425, - "train/contrastive_loss": 2.069138526916504, - "train/negative_loss": 2.0678725242614746, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.001265963539481163, - "train/total_loss": 0.6601717472076416 + "train/classification_loss": 0.31207919120788574, + "train/contrastive_loss": 3.9416584968566895, + "train/negative_loss": 2.3110086917877197, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.6306499242782593, + "train/total_loss": 1.1004109382629395 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.220631942152977, - "train/contrastive_loss": 1.9464044570922852, - "train/negative_loss": 1.8838516473770142, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.06255282461643219, - "train/total_loss": 0.6099128127098083 + "train/classification_loss": 0.2047160267829895, + "train/contrastive_loss": 3.0547940731048584, + "train/negative_loss": 1.8693389892578125, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.185455083847046, + "train/total_loss": 0.8156748414039612 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.24497845768928528, - "train/contrastive_loss": 1.1590956449508667, - "train/negative_loss": 1.1042920351028442, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.05480358749628067, - "train/total_loss": 0.47679758071899414 + "train/classification_loss": 0.28234678506851196, + "train/contrastive_loss": 2.6560606956481934, + "train/negative_loss": 2.1974549293518066, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.4586058557033539, + "train/total_loss": 0.8135589361190796 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.29513853788375854, - "train/contrastive_loss": 2.2196333408355713, - "train/negative_loss": 1.7997887134552002, - "train/num_negatives": 40, + "train/classification_loss": 0.2614976763725281, + "train/contrastive_loss": 1.7249749898910522, + "train/negative_loss": 1.6987032890319824, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.4198446571826935, - "train/total_loss": 0.7390651702880859 + "train/positive_loss": 0.02627166360616684, + "train/total_loss": 0.6064926385879517 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.31698620319366455, - "train/contrastive_loss": 1.467206358909607, - "train/negative_loss": 1.0750025510787964, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.39220380783081055, - "train/total_loss": 0.6104274988174438 + "train/classification_loss": 0.272960901260376, + "train/contrastive_loss": 2.9053120613098145, + "train/negative_loss": 1.705049991607666, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 1.200262188911438, + "train/total_loss": 0.8540233373641968 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.30684995651245117, - "train/contrastive_loss": 1.879387617111206, - "train/negative_loss": 1.8716548681259155, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.00773277971893549, - "train/total_loss": 0.6827274560928345 + "train/classification_loss": 0.30305367708206177, + "train/contrastive_loss": 1.5640089511871338, + "train/negative_loss": 1.4782166481018066, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.08579232543706894, + "train/total_loss": 0.6158554553985596 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.24463358521461487, - "train/contrastive_loss": 2.313711643218994, - "train/negative_loss": 2.1724820137023926, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.14122968912124634, - "train/total_loss": 0.7073758840560913 + "train/classification_loss": 0.23551839590072632, + "train/contrastive_loss": 2.1996805667877197, + "train/negative_loss": 1.8477649688720703, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.35191550850868225, + "train/total_loss": 0.6754544973373413 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.3067975640296936, - "train/contrastive_loss": 3.284423351287842, - "train/negative_loss": 1.8870248794555664, - "train/num_negatives": 44, + "train/classification_loss": 0.23813864588737488, + "train/contrastive_loss": 1.5576269626617432, + "train/negative_loss": 1.4352878332138062, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.397398591041565, - "train/total_loss": 0.963682234287262 + "train/positive_loss": 0.12233909219503403, + "train/total_loss": 0.5496640205383301 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.319360613822937, - "train/contrastive_loss": 2.3497543334960938, - "train/negative_loss": 2.2107105255126953, - "train/num_negatives": 44, + "train/classification_loss": 0.2204272598028183, + "train/contrastive_loss": 2.505669355392456, + "train/negative_loss": 1.9168288707733154, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.13904379308223724, - "train/total_loss": 0.7893115282058716 + "train/positive_loss": 0.5888404846191406, + "train/total_loss": 0.7215611338615417 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.23326444625854492, - "train/contrastive_loss": 1.3863937854766846, - "train/negative_loss": 1.2021559476852417, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.18423783779144287, - "train/total_loss": 0.5105432271957397 + "train/classification_loss": 0.28241947293281555, + "train/contrastive_loss": 2.472677230834961, + "train/negative_loss": 1.5921576023101807, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.8805195689201355, + "train/total_loss": 0.7769548892974854 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.22244426608085632, - "train/contrastive_loss": 1.3176202774047852, - "train/negative_loss": 0.7938833236694336, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.5237370133399963, - "train/total_loss": 0.48596832156181335 + "train/classification_loss": 0.2984713912010193, + "train/contrastive_loss": 2.957724094390869, + "train/negative_loss": 1.658460021018982, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.2992639541625977, + "train/total_loss": 0.8900161981582642 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2026320844888687, - "train/contrastive_loss": 2.213942289352417, - "train/negative_loss": 2.196601152420044, + "train/classification_loss": 0.28209152817726135, + "train/contrastive_loss": 2.216071605682373, + "train/negative_loss": 1.2685127258300781, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.017341088503599167, - "train/total_loss": 0.6454205513000488 + "train/num_positives": 10, + "train/positive_loss": 0.9475589990615845, + "train/total_loss": 0.7253058552742004 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.3040400743484497, - "train/contrastive_loss": 1.3410011529922485, - "train/negative_loss": 0.37236323952674866, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 0.9686379432678223, - "train/total_loss": 0.5722403526306152 + "train/classification_loss": 0.26708120107650757, + "train/contrastive_loss": 3.642721176147461, + "train/negative_loss": 2.2846689224243164, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.3580522537231445, + "train/total_loss": 0.9956254363059998 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.28776150941848755, - "train/contrastive_loss": 1.641850233078003, - "train/negative_loss": 1.6310104131698608, + "train/classification_loss": 0.2888607680797577, + "train/contrastive_loss": 1.6935940980911255, + "train/negative_loss": 1.6417105197906494, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.010839840397238731, - "train/total_loss": 0.6161315441131592 + "train/num_positives": 4, + "train/positive_loss": 0.051883574575185776, + "train/total_loss": 0.6275795698165894 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2818530201911926, - "train/contrastive_loss": 2.272491693496704, - "train/negative_loss": 2.1244754791259766, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.14801615476608276, - "train/total_loss": 0.7363513708114624 + "train/classification_loss": 0.2867181599140167, + "train/contrastive_loss": 0.2821022868156433, + "train/negative_loss": 0.24514326453208923, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.03695903345942497, + "train/total_loss": 0.34313860535621643 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2864355742931366, - "train/contrastive_loss": 1.2537990808486938, - "train/negative_loss": 1.2483224868774414, - "train/num_negatives": 40, + "train/classification_loss": 0.2716374397277832, + "train/contrastive_loss": 4.49190616607666, + "train/negative_loss": 2.18587064743042, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.005476551130414009, - "train/total_loss": 0.5371953845024109 + "train/positive_loss": 2.3060357570648193, + "train/total_loss": 1.1700186729431152 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.3028380572795868, - "train/contrastive_loss": 2.998008966445923, - "train/negative_loss": 2.3175406455993652, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.6804683208465576, - "train/total_loss": 0.9024398326873779 + "train/classification_loss": 0.3197396695613861, + "train/contrastive_loss": 1.5733642578125, + "train/negative_loss": 0.9986933469772339, + "train/num_negatives": 38, + "train/num_positives": 10, + "train/positive_loss": 0.5746709704399109, + "train/total_loss": 0.6344125270843506 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2790559232234955, - "train/contrastive_loss": 2.0663206577301025, - "train/negative_loss": 1.4832245111465454, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.5830960869789124, - "train/total_loss": 0.6923200488090515 + "train/classification_loss": 0.23270614445209503, + "train/contrastive_loss": 1.7262274026870728, + "train/negative_loss": 1.7245793342590332, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.0016481271013617516, + "train/total_loss": 0.5779516100883484 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2718316912651062, - "train/contrastive_loss": 3.0426084995269775, - "train/negative_loss": 2.6247479915618896, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.4178604483604431, - "train/total_loss": 0.8803533911705017 + "train/classification_loss": 0.2607567608356476, + "train/contrastive_loss": 5.528561592102051, + "train/negative_loss": 2.7974326610565186, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 2.7311289310455322, + "train/total_loss": 1.3664690256118774 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.3339521884918213, - "train/contrastive_loss": 1.418155550956726, - "train/negative_loss": 1.415216088294983, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0029394275043159723, - "train/total_loss": 0.6175832748413086 + "train/classification_loss": 0.27459150552749634, + "train/contrastive_loss": 3.4055511951446533, + "train/negative_loss": 2.3855397701263428, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.0200114250183105, + "train/total_loss": 0.9557017683982849 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.290495365858078, - "train/contrastive_loss": 2.517930507659912, - "train/negative_loss": 2.3389174938201904, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.17901305854320526, - "train/total_loss": 0.794081449508667 + "train/classification_loss": 0.28914380073547363, + "train/contrastive_loss": 1.8177766799926758, + "train/negative_loss": 1.659364104270935, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.15841253101825714, + "train/total_loss": 0.6526991128921509 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.26782140135765076, - "train/contrastive_loss": 3.9957876205444336, - "train/negative_loss": 2.761676073074341, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.2341114282608032, - "train/total_loss": 1.066978931427002 + "train/classification_loss": 0.31958192586898804, + "train/contrastive_loss": 3.929149627685547, + "train/negative_loss": 2.4659814834594727, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 1.4631681442260742, + "train/total_loss": 1.1054118871688843 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.24464349448680878, - "train/contrastive_loss": 4.319703578948975, - "train/negative_loss": 2.3003790378570557, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 2.019324541091919, - "train/total_loss": 1.1085841655731201 + "train/classification_loss": 0.2196313440799713, + "train/contrastive_loss": 3.1857128143310547, + "train/negative_loss": 2.962709426879883, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.22300350666046143, + "train/total_loss": 0.8567739725112915 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.26179882884025574, - "train/contrastive_loss": 3.0299952030181885, - "train/negative_loss": 2.8075833320617676, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.2224118411540985, - "train/total_loss": 0.8677978515625 + "train/classification_loss": 0.28469201922416687, + "train/contrastive_loss": 2.296447992324829, + "train/negative_loss": 1.8910917043685913, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 0.40535634756088257, + "train/total_loss": 0.7439815998077393 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2511751055717468, - "train/contrastive_loss": 2.128631353378296, - "train/negative_loss": 1.8583238124847412, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.2703075110912323, - "train/total_loss": 0.6769013404846191 + "train/classification_loss": 0.3504771292209625, + "train/contrastive_loss": 4.495262145996094, + "train/negative_loss": 4.488855838775635, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.0064062997698783875, + "train/total_loss": 1.2495296001434326 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2915743291378021, - "train/contrastive_loss": 2.020571231842041, - "train/negative_loss": 2.0020830631256104, - "train/num_negatives": 46, + "train/classification_loss": 0.27917760610580444, + "train/contrastive_loss": 1.010267734527588, + "train/negative_loss": 0.7466593980789185, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.26360830664634705, + "train/total_loss": 0.481231153011322 + }, + { + "epoch": 1.76056338028169, + "step": 500, + "train/classification_loss": 0.3012574315071106, + "train/contrastive_loss": 4.016504287719727, + "train/negative_loss": 2.8275396823883057, + "train/num_negatives": 42, "train/num_positives": 8, - "train/positive_loss": 0.018488101661205292, - "train/total_loss": 0.6956886053085327 + "train/positive_loss": 1.18896484375, + "train/total_loss": 1.1045582294464111 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.26607683300971985, - "train/contrastive_loss": 2.520843744277954, - "train/negative_loss": 2.5175375938415527, + "train/classification_loss": 0.2221851497888565, + "train/contrastive_loss": 1.6562566757202148, + "train/negative_loss": 1.2890082597732544, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.0033060661517083645, - "train/total_loss": 0.7702455520629883 + "train/num_positives": 10, + "train/positive_loss": 0.36724844574928284, + "train/total_loss": 0.5534365177154541 + }, + { + "epoch": 1.76056338028169, + "step": 500, + "train/classification_loss": 0.24506540596485138, + "train/contrastive_loss": 5.210491180419922, + "train/negative_loss": 3.3771255016326904, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 1.8333656787872314, + "train/total_loss": 1.2871637344360352 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2455340325832367, - "train/contrastive_loss": 1.443027377128601, - "train/negative_loss": 1.418811559677124, + "train/classification_loss": 0.3047761023044586, + "train/contrastive_loss": 1.3365381956100464, + "train/negative_loss": 1.3220471143722534, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.01449110172688961, + "train/total_loss": 0.5720837116241455 + }, + { + "epoch": 1.76056338028169, + "step": 500, + "train/classification_loss": 0.2840941548347473, + "train/contrastive_loss": 2.062333345413208, + "train/negative_loss": 2.056055784225464, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.02421583980321884, - "train/total_loss": 0.5341395139694214 + "train/positive_loss": 0.0062774671241641045, + "train/total_loss": 0.6965608596801758 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2530542016029358, - "train/contrastive_loss": 2.1591179370880127, - "train/negative_loss": 2.1420891284942627, - "train/num_negatives": 36, + "train/classification_loss": 0.28721535205841064, + "train/contrastive_loss": 1.5204625129699707, + "train/negative_loss": 1.4459203481674194, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.07454212009906769, + "train/total_loss": 0.5913078784942627 + }, + { + "epoch": 1.76056338028169, + "step": 500, + "train/classification_loss": 0.33346113562583923, + "train/contrastive_loss": 3.6520848274230957, + "train/negative_loss": 3.217862844467163, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.01702870801091194, - "train/total_loss": 0.6848777532577515 + "train/positive_loss": 0.43422210216522217, + "train/total_loss": 1.063878059387207 + }, + { + "epoch": 1.76056338028169, + "step": 500, + "train/classification_loss": 0.25263580679893494, + "train/contrastive_loss": 4.213356971740723, + "train/negative_loss": 1.8085908889770508, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 2.404766321182251, + "train/total_loss": 1.0953072309494019 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.3019786477088928, - "train/contrastive_loss": 1.8163037300109863, - "train/negative_loss": 1.6808263063430786, + "train/classification_loss": 0.27537038922309875, + "train/contrastive_loss": 1.8133575916290283, + "train/negative_loss": 1.4918739795684814, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.1354774385690689, - "train/total_loss": 0.6652393937110901 + "train/num_positives": 14, + "train/positive_loss": 0.3214835524559021, + "train/total_loss": 0.6380419135093689 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.24629688262939453, - "train/contrastive_loss": 2.1531715393066406, - "train/negative_loss": 1.9413652420043945, + "train/classification_loss": 0.31176668405532837, + "train/contrastive_loss": 2.0695607662200928, + "train/negative_loss": 2.0549192428588867, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.21180641651153564, - "train/total_loss": 0.6769312024116516 + "train/num_positives": 2, + "train/positive_loss": 0.01464143581688404, + "train/total_loss": 0.7256788015365601 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2410711944103241, - "train/contrastive_loss": 1.6536691188812256, - "train/negative_loss": 1.2662653923034668, + "train/classification_loss": 0.2532116770744324, + "train/contrastive_loss": 2.148019790649414, + "train/negative_loss": 1.1890658140182495, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.387403666973114, - "train/total_loss": 0.5718050003051758 + "train/num_positives": 16, + "train/positive_loss": 0.958953857421875, + "train/total_loss": 0.682815670967102 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.333817720413208, - "train/contrastive_loss": 2.4586942195892334, - "train/negative_loss": 1.9033467769622803, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.5553474426269531, - "train/total_loss": 0.8255565762519836 + "train/classification_loss": 0.30827730894088745, + "train/contrastive_loss": 2.331303358078003, + "train/negative_loss": 2.268155813217163, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.06314753741025925, + "train/total_loss": 0.774537980556488 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.23226286470890045, - "train/contrastive_loss": 1.9567073583602905, - "train/negative_loss": 1.9541723728179932, - "train/num_negatives": 48, + "train/classification_loss": 0.31441375613212585, + "train/contrastive_loss": 1.7953717708587646, + "train/negative_loss": 1.6414676904678345, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 0.0025349720381200314, - "train/total_loss": 0.6236043572425842 + "train/positive_loss": 0.1539040207862854, + "train/total_loss": 0.6734881401062012 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.26705190539360046, - "train/contrastive_loss": 0.6753894686698914, - "train/negative_loss": 0.6321234703063965, + "train/classification_loss": 0.2828734219074249, + "train/contrastive_loss": 1.2499476671218872, + "train/negative_loss": 1.1132442951202393, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.04326602444052696, - "train/total_loss": 0.40212979912757874 + "train/num_positives": 14, + "train/positive_loss": 0.13670335710048676, + "train/total_loss": 0.5328629612922668 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2437479943037033, - "train/contrastive_loss": 1.8337740898132324, - "train/negative_loss": 1.7220194339752197, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.1117546334862709, - "train/total_loss": 0.6105028390884399 + "train/classification_loss": 0.35744303464889526, + "train/contrastive_loss": 2.8758091926574707, + "train/negative_loss": 2.5653278827667236, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 0.31048136949539185, + "train/total_loss": 0.9326049089431763 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.31455138325691223, - "train/contrastive_loss": 0.6476645469665527, - "train/negative_loss": 0.5985459089279175, - "train/num_negatives": 28, + "train/classification_loss": 0.23784872889518738, + "train/contrastive_loss": 1.8612314462661743, + "train/negative_loss": 1.859705924987793, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.04911866411566734, - "train/total_loss": 0.4440842866897583 + "train/positive_loss": 0.0015254702884703875, + "train/total_loss": 0.6100950241088867 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.277453750371933, - "train/contrastive_loss": 2.4395499229431152, - "train/negative_loss": 1.920211672782898, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.5193381905555725, - "train/total_loss": 0.7653637528419495 + "train/classification_loss": 0.24389959871768951, + "train/contrastive_loss": 1.5987324714660645, + "train/negative_loss": 0.9607344269752502, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.6379980444908142, + "train/total_loss": 0.5636460781097412 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2492220252752304, - "train/contrastive_loss": 2.217311382293701, - "train/negative_loss": 2.2122128009796143, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.005098478402942419, - "train/total_loss": 0.6926842927932739 + "train/classification_loss": 0.2681601643562317, + "train/contrastive_loss": 2.4863693714141846, + "train/negative_loss": 2.1036064624786377, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.3827628493309021, + "train/total_loss": 0.7654340267181396 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.26092731952667236, - "train/contrastive_loss": 2.329272508621216, - "train/negative_loss": 1.2097499370574951, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.1195225715637207, - "train/total_loss": 0.7267818450927734 + "train/classification_loss": 0.28281816840171814, + "train/contrastive_loss": 4.531801223754883, + "train/negative_loss": 2.6227142810821533, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.909087061882019, + "train/total_loss": 1.189178466796875 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2740970253944397, - "train/contrastive_loss": 3.4188127517700195, - "train/negative_loss": 2.8697423934936523, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.5490702390670776, - "train/total_loss": 0.9578595757484436 + "train/classification_loss": 0.2909647524356842, + "train/contrastive_loss": 2.298614501953125, + "train/negative_loss": 1.843584418296814, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.4550301432609558, + "train/total_loss": 0.7506876587867737 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2725520133972168, - "train/contrastive_loss": 2.088278293609619, - "train/negative_loss": 1.3867937326431274, + "train/classification_loss": 0.25383731722831726, + "train/contrastive_loss": 0.5181118845939636, + "train/negative_loss": 0.4596084654331207, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.7014846205711365, - "train/total_loss": 0.6902077198028564 + "train/num_positives": 16, + "train/positive_loss": 0.058503407984972, + "train/total_loss": 0.35745969414711 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.24089549481868744, - "train/contrastive_loss": 3.4256019592285156, - "train/negative_loss": 3.251102924346924, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.17449894547462463, - "train/total_loss": 0.9260159134864807 + "train/classification_loss": 0.27694326639175415, + "train/contrastive_loss": 2.7504169940948486, + "train/negative_loss": 1.8726387023925781, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 0.8777782320976257, + "train/total_loss": 0.8270266652107239 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.3086997866630554, - "train/contrastive_loss": 3.256136417388916, - "train/negative_loss": 2.1127631664276123, + "train/classification_loss": 0.29925021529197693, + "train/contrastive_loss": 2.403785467147827, + "train/negative_loss": 2.342350959777832, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.1433732509613037, - "train/total_loss": 0.9599270820617676 + "train/num_positives": 2, + "train/positive_loss": 0.061434555798769, + "train/total_loss": 0.7800073027610779 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.26777952909469604, - "train/contrastive_loss": 2.9351818561553955, - "train/negative_loss": 2.9260306358337402, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.00915125384926796, - "train/total_loss": 0.8548159003257751 + "train/classification_loss": 0.23116818070411682, + "train/contrastive_loss": 1.8308014869689941, + "train/negative_loss": 1.4933220148086548, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.33747944235801697, + "train/total_loss": 0.5973284840583801 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.23266853392124176, - "train/contrastive_loss": 2.309629440307617, - "train/negative_loss": 1.964940071105957, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.3446894586086273, - "train/total_loss": 0.6945944428443909 + "train/classification_loss": 0.27349355816841125, + "train/contrastive_loss": 2.776144504547119, + "train/negative_loss": 2.7390992641448975, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.0370451882481575, + "train/total_loss": 0.8287224769592285 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2580176889896393, - "train/contrastive_loss": 2.5884251594543457, - "train/negative_loss": 2.012775421142578, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.5756496787071228, - "train/total_loss": 0.775702714920044 + "train/classification_loss": 0.3065961003303528, + "train/contrastive_loss": 3.2309837341308594, + "train/negative_loss": 1.5713709592819214, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 1.6596126556396484, + "train/total_loss": 0.9527928829193115 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2785678803920746, - "train/contrastive_loss": 4.601867198944092, - "train/negative_loss": 4.209553241729736, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.39231374859809875, - "train/total_loss": 1.1989413499832153 + "train/classification_loss": 0.2666000425815582, + "train/contrastive_loss": 3.2088193893432617, + "train/negative_loss": 3.2054524421691895, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.0033669769763946533, + "train/total_loss": 0.908363938331604 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2743292450904846, - "train/contrastive_loss": 3.424619197845459, - "train/negative_loss": 2.656193971633911, + "train/classification_loss": 0.2936076521873474, + "train/contrastive_loss": 1.6566014289855957, + "train/negative_loss": 1.557382345199585, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.7684252858161926, - "train/total_loss": 0.9592530727386475 + "train/positive_loss": 0.09921909123659134, + "train/total_loss": 0.6249279379844666 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.2724975645542145, - "train/contrastive_loss": 1.032958984375, - "train/negative_loss": 1.0323991775512695, + "train/classification_loss": 0.2817278504371643, + "train/contrastive_loss": 2.2113726139068604, + "train/negative_loss": 2.1751155853271484, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.0005598097341135144, - "train/total_loss": 0.4790893793106079 + "train/num_positives": 8, + "train/positive_loss": 0.03625708073377609, + "train/total_loss": 0.7240023612976074 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.23517067730426788, - "train/contrastive_loss": 2.9819934368133545, - "train/negative_loss": 2.9269683361053467, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.055025044828653336, - "train/total_loss": 0.8315693736076355 + "train/classification_loss": 0.228508859872818, + "train/contrastive_loss": 2.889946460723877, + "train/negative_loss": 2.2652790546417236, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.6246672868728638, + "train/total_loss": 0.8064981698989868 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.27856242656707764, - "train/contrastive_loss": 2.264885902404785, - "train/negative_loss": 2.2433114051818848, - "train/num_negatives": 46, + "train/classification_loss": 0.30241695046424866, + "train/contrastive_loss": 2.6104650497436523, + "train/negative_loss": 1.6172579526901245, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.021574577316641808, - "train/total_loss": 0.7315396070480347 + "train/positive_loss": 0.9932072162628174, + "train/total_loss": 0.8245099782943726 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.3237121105194092, - "train/contrastive_loss": 2.1508140563964844, - "train/negative_loss": 2.1508140563964844, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.7538748979568481 - }, - { - "epoch": 1.9011406844106464, - "eval_exact_match_accuracy": 0.045714285714285714, - "eval_hamming_loss": 0.0915406162464986, - "eval_loss": 0.7327830791473389, - "eval_macro_f1": 0.027115678985348786, - "eval_macro_precision": 0.058823529411764705, - "eval_macro_recall": 0.017618641659562374, - "eval_micro_f1": 0.13177470775770456, - "eval_micro_precision": 1.0, - "eval_micro_recall": 0.07053469852104664, - "eval_runtime": 2.6258, - "eval_samples_per_second": 199.941, - "eval_steps_per_second": 25.135, + "train/classification_loss": 0.3064451217651367, + "train/contrastive_loss": 2.2361652851104736, + "train/negative_loss": 1.6052446365356445, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.6309205889701843, + "train/total_loss": 0.7536782026290894 + }, + { + "epoch": 1.76056338028169, + "eval_exact_match_accuracy": 0.03527336860670194, + "eval_hamming_loss": 0.09295570079883805, + "eval_loss": 0.7930232286453247, + "eval_macro_f1": 0.02187651920272241, + "eval_macro_precision": 0.05514705882352941, + "eval_macro_recall": 0.01364463311097635, + "eval_micro_f1": 0.09127789046653144, + "eval_micro_precision": 0.9375, + "eval_micro_recall": 0.04797441364605544, + "eval_runtime": 2.8414, + "eval_samples_per_second": 199.548, + "eval_steps_per_second": 24.987, "step": 500 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.3045381009578705, - "train/contrastive_loss": 0.7964693307876587, - "train/negative_loss": 0.7736365795135498, - "train/num_negatives": 38, - "train/num_positives": 4, - "train/positive_loss": 0.02283276431262493, - "train/total_loss": 0.46383196115493774 + "train/classification_loss": 0.272177129983902, + "train/contrastive_loss": 1.6633307933807373, + "train/negative_loss": 1.0278187990188599, + "train/num_negatives": 46, + "train/num_positives": 10, + "train/positive_loss": 0.6355120539665222, + "train/total_loss": 0.604843258857727 }, { - "epoch": 1.9011406844106464, + "epoch": 1.76056338028169, "step": 500, - "train/classification_loss": 0.26485320925712585, - "train/contrastive_loss": 1.7239432334899902, - "train/negative_loss": 0.9590576887130737, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.7648855447769165, - "train/total_loss": 0.6096418499946594 + "train/classification_loss": 0.2887512147426605, + "train/contrastive_loss": 1.1888062953948975, + "train/negative_loss": 0.9608774185180664, + "train/num_negatives": 40, + "train/num_positives": 8, + "train/positive_loss": 0.22792884707450867, + "train/total_loss": 0.5265125036239624 }, { - "epoch": 2.091254752851711, - "grad_norm": 16.867555618286133, - "learning_rate": 1.993196347031964e-05, - "loss": 1.158, + "epoch": 1.936619718309859, + "grad_norm": 19.463146209716797, + "learning_rate": 1.9937138830162087e-05, + "loss": 1.1723, "step": 550 }, { - "epoch": 2.091254752851711, + "epoch": 1.936619718309859, "step": 550, - "train/classification_loss": 0.2603025436401367, - "train/contrastive_loss": 1.8860293626785278, - "train/negative_loss": 1.766381025314331, - "train/num_negatives": 24, - "train/num_positives": 20, - "train/positive_loss": 0.11964833736419678, - "train/total_loss": 0.6375083923339844 + "train/classification_loss": 0.26050716638565063, + "train/contrastive_loss": 1.7977603673934937, + "train/negative_loss": 1.2410331964492798, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.5567271709442139, + "train/total_loss": 0.6200592517852783 }, { - "epoch": 2.091254752851711, + "epoch": 1.936619718309859, "step": 550, - "train/classification_loss": 0.30722472071647644, - "train/contrastive_loss": 1.5574275255203247, - "train/negative_loss": 1.4822114706039429, - "train/num_negatives": 32, - "train/num_positives": 14, - "train/positive_loss": 0.07521605491638184, - "train/total_loss": 0.6187102198600769 + "train/classification_loss": 0.27938032150268555, + "train/contrastive_loss": 1.2287302017211914, + "train/negative_loss": 1.056685209274292, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.17204496264457703, + "train/total_loss": 0.5251263380050659 }, { - "epoch": 2.2813688212927756, - "grad_norm": 13.106066703796387, - "learning_rate": 1.9924353120243533e-05, - "loss": 1.0938, + "epoch": 2.112676056338028, + "grad_norm": 13.017983436584473, + "learning_rate": 1.9930091613812545e-05, + "loss": 1.1545, "step": 600 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.3053629398345947, - "train/contrastive_loss": 2.0965709686279297, - "train/negative_loss": 1.6168806552886963, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.4796903729438782, - "train/total_loss": 0.7246771454811096 + "train/classification_loss": 0.2655118405818939, + "train/contrastive_loss": 2.7165048122406006, + "train/negative_loss": 2.4909591674804688, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.2255457192659378, + "train/total_loss": 0.8088128566741943 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.2780905067920685, - "train/contrastive_loss": 3.795358180999756, - "train/negative_loss": 1.9760562181472778, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 1.819301962852478, - "train/total_loss": 1.037162184715271 + "train/classification_loss": 0.35418999195098877, + "train/contrastive_loss": 1.7897865772247314, + "train/negative_loss": 1.7852965593338013, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.004490070044994354, + "train/total_loss": 0.7121473550796509 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.23761163651943207, - "train/contrastive_loss": 2.3671178817749023, - "train/negative_loss": 0.8812187314033508, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.4858992099761963, - "train/total_loss": 0.7110351920127869 + "train/classification_loss": 0.2882835566997528, + "train/contrastive_loss": 3.125886917114258, + "train/negative_loss": 2.148383617401123, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.9775032997131348, + "train/total_loss": 0.9134609699249268 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.24044281244277954, - "train/contrastive_loss": 3.2543113231658936, - "train/negative_loss": 2.429713249206543, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.8245981335639954, - "train/total_loss": 0.8913050889968872 + "train/classification_loss": 0.2018880397081375, + "train/contrastive_loss": 2.4460976123809814, + "train/negative_loss": 2.344330310821533, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.10176732391119003, + "train/total_loss": 0.6911075711250305 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.27325311303138733, - "train/contrastive_loss": 2.117338180541992, - "train/negative_loss": 1.9147635698318481, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.20257455110549927, - "train/total_loss": 0.6967207193374634 + "train/classification_loss": 0.262895405292511, + "train/contrastive_loss": 3.8667688369750977, + "train/negative_loss": 3.8429808616638184, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.023787880316376686, + "train/total_loss": 1.0362491607666016 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.26346445083618164, - "train/contrastive_loss": 1.7167760133743286, - "train/negative_loss": 1.5592583417892456, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.1575176864862442, - "train/total_loss": 0.6068196296691895 + "train/classification_loss": 0.27121493220329285, + "train/contrastive_loss": 3.6091127395629883, + "train/negative_loss": 2.9608404636383057, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.6482722759246826, + "train/total_loss": 0.9930374622344971 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.3129427433013916, - "train/contrastive_loss": 2.6253774166107178, - "train/negative_loss": 2.0711331367492676, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.5542442798614502, - "train/total_loss": 0.8380182385444641 + "train/classification_loss": 0.25528448820114136, + "train/contrastive_loss": 2.0596120357513428, + "train/negative_loss": 1.8073989152908325, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.25221318006515503, + "train/total_loss": 0.667206883430481 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.2176736742258072, - "train/contrastive_loss": 2.1931509971618652, - "train/negative_loss": 1.4539037942886353, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.7392470836639404, - "train/total_loss": 0.656303882598877 + "train/classification_loss": 0.29203322529792786, + "train/contrastive_loss": 1.5734552145004272, + "train/negative_loss": 1.573405385017395, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 4.983072358299978e-05, + "train/total_loss": 0.6067242622375488 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.22842015326023102, - "train/contrastive_loss": 1.916088342666626, - "train/negative_loss": 1.8641259670257568, + "train/classification_loss": 0.2447809875011444, + "train/contrastive_loss": 1.3014971017837524, + "train/negative_loss": 1.2134637832641602, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.05196234583854675, - "train/total_loss": 0.6116378307342529 + "train/positive_loss": 0.08803336322307587, + "train/total_loss": 0.5050804018974304 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.32319962978363037, - "train/contrastive_loss": 3.6255459785461426, - "train/negative_loss": 2.826795816421509, + "train/classification_loss": 0.28763678669929504, + "train/contrastive_loss": 3.355006694793701, + "train/negative_loss": 2.41642165184021, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.7987500429153442, - "train/total_loss": 1.0483088493347168 + "train/num_positives": 14, + "train/positive_loss": 0.9385851621627808, + "train/total_loss": 0.9586381912231445 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.2530325651168823, - "train/contrastive_loss": 1.861983299255371, - "train/negative_loss": 1.6803133487701416, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.18166998028755188, - "train/total_loss": 0.6254292726516724 + "train/classification_loss": 0.24386745691299438, + "train/contrastive_loss": 1.6079519987106323, + "train/negative_loss": 1.6015613079071045, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.006390690803527832, + "train/total_loss": 0.565457820892334 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.22002524137496948, - "train/contrastive_loss": 1.791921615600586, - "train/negative_loss": 1.2439730167388916, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.5479485988616943, - "train/total_loss": 0.5784095525741577 + "train/classification_loss": 0.27382519841194153, + "train/contrastive_loss": 2.1843647956848145, + "train/negative_loss": 2.135948657989502, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.048416100442409515, + "train/total_loss": 0.710698127746582 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.276313841342926, - "train/contrastive_loss": 3.3962888717651367, - "train/negative_loss": 3.166245698928833, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.23004305362701416, - "train/total_loss": 0.9555716514587402 + "train/classification_loss": 0.27145224809646606, + "train/contrastive_loss": 5.196383476257324, + "train/negative_loss": 4.228582382202148, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.9678012132644653, + "train/total_loss": 1.3107290267944336 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.23602746427059174, - "train/contrastive_loss": 1.8867781162261963, - "train/negative_loss": 1.8650411367416382, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.021737001836299896, - "train/total_loss": 0.6133831143379211 + "train/classification_loss": 0.307817280292511, + "train/contrastive_loss": 1.743464708328247, + "train/negative_loss": 1.4246816635131836, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.31878307461738586, + "train/total_loss": 0.6565102338790894 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.2137341946363449, - "train/contrastive_loss": 1.9745721817016602, - "train/negative_loss": 1.550823450088501, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.42374879121780396, - "train/total_loss": 0.6086486577987671 + "train/classification_loss": 0.19442690908908844, + "train/contrastive_loss": 2.4461112022399902, + "train/negative_loss": 1.6319011449813843, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.8142101168632507, + "train/total_loss": 0.6836491823196411 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.23502852022647858, - "train/contrastive_loss": 1.2561421394348145, - "train/negative_loss": 1.2300574779510498, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.02608466148376465, - "train/total_loss": 0.4862569570541382 + "train/classification_loss": 0.27335432171821594, + "train/contrastive_loss": 2.657935380935669, + "train/negative_loss": 2.2297253608703613, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.42820996046066284, + "train/total_loss": 0.8049414157867432 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.2901841104030609, - "train/contrastive_loss": 2.6934168338775635, - "train/negative_loss": 2.584892749786377, - "train/num_negatives": 40, + "train/classification_loss": 0.24967409670352936, + "train/contrastive_loss": 2.3317456245422363, + "train/negative_loss": 2.2358877658843994, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.10852408409118652, - "train/total_loss": 0.8288674354553223 + "train/positive_loss": 0.09585781395435333, + "train/total_loss": 0.7160232067108154 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.3048149645328522, - "train/contrastive_loss": 1.1874828338623047, - "train/negative_loss": 0.8815872073173523, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.30589559674263, - "train/total_loss": 0.5423115491867065 + "train/classification_loss": 0.26585885882377625, + "train/contrastive_loss": 2.33823299407959, + "train/negative_loss": 2.2738454341888428, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.06438751518726349, + "train/total_loss": 0.7335054874420166 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.3013513386249542, - "train/contrastive_loss": 1.564026117324829, - "train/negative_loss": 1.5086508989334106, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.05537520349025726, - "train/total_loss": 0.6141566038131714 + "train/classification_loss": 0.2969436049461365, + "train/contrastive_loss": 2.2686820030212402, + "train/negative_loss": 2.2569010257720947, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.011780895292758942, + "train/total_loss": 0.7506799697875977 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.23683418333530426, - "train/contrastive_loss": 4.1694841384887695, - "train/negative_loss": 2.391162633895874, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.7783215045928955, - "train/total_loss": 1.0707310438156128 + "train/classification_loss": 0.22988630831241608, + "train/contrastive_loss": 2.651657819747925, + "train/negative_loss": 2.634925365447998, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.016732439398765564, + "train/total_loss": 0.7602178454399109 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.2994956970214844, - "train/contrastive_loss": 3.1649837493896484, - "train/negative_loss": 1.733036756515503, - "train/num_negatives": 44, + "train/classification_loss": 0.22725173830986023, + "train/contrastive_loss": 1.5604908466339111, + "train/negative_loss": 1.3795166015625, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.431947112083435, - "train/total_loss": 0.9324924349784851 + "train/positive_loss": 0.18097421526908875, + "train/total_loss": 0.5393499135971069 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.31914520263671875, - "train/contrastive_loss": 1.9854604005813599, - "train/negative_loss": 1.9291094541549683, - "train/num_negatives": 44, + "train/classification_loss": 0.20920825004577637, + "train/contrastive_loss": 2.2791993618011475, + "train/negative_loss": 2.1695494651794434, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.056350987404584885, - "train/total_loss": 0.7162373065948486 + "train/positive_loss": 0.10964998602867126, + "train/total_loss": 0.6650481224060059 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.2258186638355255, - "train/contrastive_loss": 1.5336418151855469, - "train/negative_loss": 1.0968799591064453, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.4367617964744568, - "train/total_loss": 0.5325469970703125 + "train/classification_loss": 0.2731555700302124, + "train/contrastive_loss": 1.913442850112915, + "train/negative_loss": 1.52596116065979, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.3874816298484802, + "train/total_loss": 0.6558441519737244 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.21134836971759796, - "train/contrastive_loss": 1.9585018157958984, - "train/negative_loss": 0.526372492313385, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 1.4321293830871582, - "train/total_loss": 0.6030487418174744 + "train/classification_loss": 0.2883538007736206, + "train/contrastive_loss": 3.0538086891174316, + "train/negative_loss": 2.366272449493408, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.6875361800193787, + "train/total_loss": 0.8991155624389648 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.1950484961271286, - "train/contrastive_loss": 1.9791289567947388, - "train/negative_loss": 1.7946821451187134, + "train/classification_loss": 0.270912766456604, + "train/contrastive_loss": 1.44975745677948, + "train/negative_loss": 1.1361711025238037, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.18444685637950897, - "train/total_loss": 0.5908743143081665 + "train/num_positives": 10, + "train/positive_loss": 0.31358638405799866, + "train/total_loss": 0.560864269733429 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.29755380749702454, - "train/contrastive_loss": 1.2474653720855713, - "train/negative_loss": 0.6533695459365845, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 0.5940958261489868, - "train/total_loss": 0.5470468997955322 + "train/classification_loss": 0.25922784209251404, + "train/contrastive_loss": 3.3822884559631348, + "train/negative_loss": 2.331347703933716, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.0509408712387085, + "train/total_loss": 0.9356855154037476 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.28541430830955505, - "train/contrastive_loss": 1.4362072944641113, - "train/negative_loss": 1.4124847650527954, + "train/classification_loss": 0.2828563153743744, + "train/contrastive_loss": 3.1865062713623047, + "train/negative_loss": 3.0384509563446045, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.02372247353196144, - "train/total_loss": 0.5726557970046997 + "train/num_positives": 4, + "train/positive_loss": 0.14805543422698975, + "train/total_loss": 0.9201575517654419 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.2749898433685303, - "train/contrastive_loss": 3.1206021308898926, - "train/negative_loss": 2.45470929145813, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.6658927202224731, - "train/total_loss": 0.8991102576255798 + "train/classification_loss": 0.2778072953224182, + "train/contrastive_loss": 0.8674440383911133, + "train/negative_loss": 0.8614189028739929, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.006025121081620455, + "train/total_loss": 0.4512960910797119 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.27938881516456604, - "train/contrastive_loss": 1.048708438873291, - "train/negative_loss": 1.0295237302780151, - "train/num_negatives": 40, + "train/classification_loss": 0.26533621549606323, + "train/contrastive_loss": 4.989627838134766, + "train/negative_loss": 2.029449224472046, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.019184691831469536, - "train/total_loss": 0.48913049697875977 + "train/positive_loss": 2.960178852081299, + "train/total_loss": 1.2632617950439453 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.2943980395793915, - "train/contrastive_loss": 3.343721389770508, - "train/negative_loss": 2.6845617294311523, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.6591595411300659, - "train/total_loss": 0.9631422758102417 + "train/classification_loss": 0.3142849802970886, + "train/contrastive_loss": 2.2525582313537598, + "train/negative_loss": 1.6249645948410034, + "train/num_negatives": 38, + "train/num_positives": 10, + "train/positive_loss": 0.6275936961174011, + "train/total_loss": 0.7647966146469116 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.27157384157180786, - "train/contrastive_loss": 1.7809405326843262, - "train/negative_loss": 0.7537832260131836, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 1.0271573066711426, - "train/total_loss": 0.627761960029602 + "train/classification_loss": 0.22230415046215057, + "train/contrastive_loss": 2.341874122619629, + "train/negative_loss": 2.341752052307129, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.0001221778802573681, + "train/total_loss": 0.6906789541244507 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.266177773475647, - "train/contrastive_loss": 2.832378387451172, - "train/negative_loss": 1.945176362991333, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.8872019052505493, - "train/total_loss": 0.8326534628868103 + "train/classification_loss": 0.2520856261253357, + "train/contrastive_loss": 4.726991176605225, + "train/negative_loss": 3.535334825515747, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.191656231880188, + "train/total_loss": 1.1974838972091675 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.329804390668869, - "train/contrastive_loss": 2.3515772819519043, - "train/negative_loss": 2.3417437076568604, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.009833484888076782, - "train/total_loss": 0.8001198768615723 + "train/classification_loss": 0.26316654682159424, + "train/contrastive_loss": 3.1302757263183594, + "train/negative_loss": 2.7062013149261475, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.4240744113922119, + "train/total_loss": 0.889221727848053 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.2850727140903473, - "train/contrastive_loss": 2.28651762008667, - "train/negative_loss": 1.3023645877838135, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.984153151512146, - "train/total_loss": 0.7423762083053589 + "train/classification_loss": 0.2838142514228821, + "train/contrastive_loss": 2.1439647674560547, + "train/negative_loss": 1.8014320135116577, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.3425328731536865, + "train/total_loss": 0.712607204914093 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.2660292685031891, - "train/contrastive_loss": 3.010007381439209, - "train/negative_loss": 2.070204019546509, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.9398033618927002, - "train/total_loss": 0.8680307865142822 + "train/classification_loss": 0.31727495789527893, + "train/contrastive_loss": 2.5879080295562744, + "train/negative_loss": 1.9560651779174805, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.6318427920341492, + "train/total_loss": 0.8348566293716431 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.23623742163181305, - "train/contrastive_loss": 3.1034445762634277, - "train/negative_loss": 1.5956696271896362, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.507774829864502, - "train/total_loss": 0.8569263219833374 + "train/classification_loss": 0.20751053094863892, + "train/contrastive_loss": 3.660047769546509, + "train/negative_loss": 3.6077892780303955, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.052258577197790146, + "train/total_loss": 0.9395201206207275 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.2530043125152588, - "train/contrastive_loss": 2.295536756515503, - "train/negative_loss": 1.7948848009109497, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.5006519556045532, - "train/total_loss": 0.7121117115020752 + "train/classification_loss": 0.27994856238365173, + "train/contrastive_loss": 3.369920492172241, + "train/negative_loss": 2.3817219734191895, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 0.9881985783576965, + "train/total_loss": 0.9539326429367065 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.2467363029718399, - "train/contrastive_loss": 2.233071804046631, - "train/negative_loss": 2.0985190868377686, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.13455261290073395, - "train/total_loss": 0.6933506727218628 + "train/classification_loss": 0.3470801115036011, + "train/contrastive_loss": 3.1829419136047363, + "train/negative_loss": 3.1593027114868164, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.023639317601919174, + "train/total_loss": 0.9836685061454773 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.2885199785232544, - "train/contrastive_loss": 2.1732215881347656, - "train/negative_loss": 1.7702298164367676, - "train/num_negatives": 46, + "train/classification_loss": 0.2744625210762024, + "train/contrastive_loss": 0.7977559566497803, + "train/negative_loss": 0.795982301235199, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.001773629686795175, + "train/total_loss": 0.4340137243270874 + }, + { + "epoch": 2.112676056338028, + "step": 600, + "train/classification_loss": 0.3006003499031067, + "train/contrastive_loss": 3.7789857387542725, + "train/negative_loss": 2.5526533126831055, + "train/num_negatives": 42, "train/num_positives": 8, - "train/positive_loss": 0.4029916524887085, - "train/total_loss": 0.7231643199920654 + "train/positive_loss": 1.226332426071167, + "train/total_loss": 1.0563974380493164 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.25913944840431213, - "train/contrastive_loss": 1.5998018980026245, - "train/negative_loss": 1.5948688983917236, + "train/classification_loss": 0.2159285992383957, + "train/contrastive_loss": 2.106112241744995, + "train/negative_loss": 1.4221737384796143, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.004932987503707409, - "train/total_loss": 0.5790998339653015 + "train/num_positives": 10, + "train/positive_loss": 0.6839384436607361, + "train/total_loss": 0.6371510624885559 + }, + { + "epoch": 2.112676056338028, + "step": 600, + "train/classification_loss": 0.2355670928955078, + "train/contrastive_loss": 3.8951456546783447, + "train/negative_loss": 3.606135129928589, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.2890104651451111, + "train/total_loss": 1.0145962238311768 + }, + { + "epoch": 2.112676056338028, + "step": 600, + "train/classification_loss": 0.2983419895172119, + "train/contrastive_loss": 1.8662009239196777, + "train/negative_loss": 1.8543726205825806, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.011828357353806496, + "train/total_loss": 0.6715822219848633 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.2402821183204651, - "train/contrastive_loss": 1.5644036531448364, - "train/negative_loss": 1.4312664270401, + "train/classification_loss": 0.2829849421977997, + "train/contrastive_loss": 2.2853145599365234, + "train/negative_loss": 2.2846763134002686, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.13313724100589752, - "train/total_loss": 0.5531628131866455 + "train/positive_loss": 0.0006382851861417294, + "train/total_loss": 0.7400478720664978 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.24936185777187347, - "train/contrastive_loss": 1.3789221048355103, - "train/negative_loss": 1.2233389616012573, - "train/num_negatives": 36, + "train/classification_loss": 0.28188222646713257, + "train/contrastive_loss": 2.4789621829986572, + "train/negative_loss": 2.3751132488250732, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.10384893417358398, + "train/total_loss": 0.777674674987793 + }, + { + "epoch": 2.112676056338028, + "step": 600, + "train/classification_loss": 0.3321971893310547, + "train/contrastive_loss": 3.455317497253418, + "train/negative_loss": 1.9387705326080322, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.15558311343193054, - "train/total_loss": 0.5251463055610657 + "train/positive_loss": 1.5165468454360962, + "train/total_loss": 1.0232607126235962 + }, + { + "epoch": 2.112676056338028, + "step": 600, + "train/classification_loss": 0.24286231398582458, + "train/contrastive_loss": 2.267987012863159, + "train/negative_loss": 1.2728211879730225, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.9951657652854919, + "train/total_loss": 0.6964597105979919 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.29741355776786804, - "train/contrastive_loss": 2.210082530975342, - "train/negative_loss": 2.0727548599243164, + "train/classification_loss": 0.2671754062175751, + "train/contrastive_loss": 2.7592761516571045, + "train/negative_loss": 2.329969882965088, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.13732758164405823, - "train/total_loss": 0.7394300699234009 + "train/num_positives": 14, + "train/positive_loss": 0.42930617928504944, + "train/total_loss": 0.8190306425094604 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.24243102967739105, - "train/contrastive_loss": 2.094785451889038, - "train/negative_loss": 1.96564519405365, + "train/classification_loss": 0.30591079592704773, + "train/contrastive_loss": 3.1203904151916504, + "train/negative_loss": 3.1192197799682617, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.12914031744003296, - "train/total_loss": 0.661388099193573 + "train/num_positives": 2, + "train/positive_loss": 0.0011705452343448997, + "train/total_loss": 0.9299888610839844 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.23425063490867615, - "train/contrastive_loss": 1.4507426023483276, - "train/negative_loss": 1.0783480405807495, + "train/classification_loss": 0.24307727813720703, + "train/contrastive_loss": 3.0907504558563232, + "train/negative_loss": 1.889597773551941, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.3723945915699005, - "train/total_loss": 0.5243991613388062 + "train/num_positives": 16, + "train/positive_loss": 1.2011526823043823, + "train/total_loss": 0.8612273931503296 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.3298943042755127, - "train/contrastive_loss": 1.8840030431747437, - "train/negative_loss": 1.8664450645446777, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.01755799539387226, - "train/total_loss": 0.7066949605941772 + "train/classification_loss": 0.29708796739578247, + "train/contrastive_loss": 3.106224775314331, + "train/negative_loss": 2.2909767627716064, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.8152480125427246, + "train/total_loss": 0.9183329343795776 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.22021904587745667, - "train/contrastive_loss": 0.9943985939025879, - "train/negative_loss": 0.9839715957641602, - "train/num_negatives": 48, + "train/classification_loss": 0.3065061569213867, + "train/contrastive_loss": 0.8311124444007874, + "train/negative_loss": 0.8197550773620605, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 0.010426976718008518, - "train/total_loss": 0.41909876465797424 + "train/positive_loss": 0.01135738380253315, + "train/total_loss": 0.4727286696434021 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.2556837201118469, - "train/contrastive_loss": 0.5158775448799133, - "train/negative_loss": 0.49861395359039307, + "train/classification_loss": 0.2737361192703247, + "train/contrastive_loss": 1.6114311218261719, + "train/negative_loss": 1.4044698476791382, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.017263609915971756, - "train/total_loss": 0.35885924100875854 + "train/num_positives": 14, + "train/positive_loss": 0.2069612443447113, + "train/total_loss": 0.596022367477417 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.22892405092716217, - "train/contrastive_loss": 1.572402000427246, - "train/negative_loss": 1.4213542938232422, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.1510477066040039, - "train/total_loss": 0.5434044599533081 + "train/classification_loss": 0.3517117202281952, + "train/contrastive_loss": 2.13155460357666, + "train/negative_loss": 2.095580577850342, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 0.03597412258386612, + "train/total_loss": 0.7780226469039917 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.30685675144195557, - "train/contrastive_loss": 0.8786717653274536, - "train/negative_loss": 0.2840949296951294, - "train/num_negatives": 28, + "train/classification_loss": 0.22330208122730255, + "train/contrastive_loss": 1.3648285865783691, + "train/negative_loss": 1.3604246377944946, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.5945768356323242, - "train/total_loss": 0.48259109258651733 + "train/positive_loss": 0.004403931554406881, + "train/total_loss": 0.49626779556274414 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.266742080450058, - "train/contrastive_loss": 2.455535650253296, - "train/negative_loss": 1.562181830406189, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.8933538198471069, - "train/total_loss": 0.7578492164611816 + "train/classification_loss": 0.22920459508895874, + "train/contrastive_loss": 1.3932069540023804, + "train/negative_loss": 1.3668732643127441, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.02633371204137802, + "train/total_loss": 0.5078459978103638 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.24250350892543793, - "train/contrastive_loss": 1.333814024925232, - "train/negative_loss": 1.323158860206604, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.010655159130692482, - "train/total_loss": 0.5092663168907166 + "train/classification_loss": 0.25943541526794434, + "train/contrastive_loss": 1.3731660842895508, + "train/negative_loss": 1.3676259517669678, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.00554013391956687, + "train/total_loss": 0.5340686440467834 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.2544557750225067, - "train/contrastive_loss": 3.5623092651367188, - "train/negative_loss": 1.285308837890625, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 2.2770004272460938, - "train/total_loss": 0.9669176340103149 + "train/classification_loss": 0.2787546217441559, + "train/contrastive_loss": 3.2431516647338867, + "train/negative_loss": 2.292062997817993, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.9510887265205383, + "train/total_loss": 0.9273849725723267 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.2696315348148346, - "train/contrastive_loss": 3.6373393535614014, - "train/negative_loss": 2.9083712100982666, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.7289682030677795, - "train/total_loss": 0.9970993995666504 + "train/classification_loss": 0.285135954618454, + "train/contrastive_loss": 2.672668933868408, + "train/negative_loss": 2.601151704788208, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.07151711732149124, + "train/total_loss": 0.8196697235107422 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.26481351256370544, - "train/contrastive_loss": 2.1052334308624268, - "train/negative_loss": 1.3028408288955688, + "train/classification_loss": 0.24279852211475372, + "train/contrastive_loss": 0.33092400431632996, + "train/negative_loss": 0.2881507873535156, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.8023926019668579, - "train/total_loss": 0.6858602166175842 + "train/num_positives": 16, + "train/positive_loss": 0.04277321696281433, + "train/total_loss": 0.30898332595825195 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.23258015513420105, - "train/contrastive_loss": 3.282727003097534, - "train/negative_loss": 2.026843547821045, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.2558834552764893, - "train/total_loss": 0.8891255855560303 + "train/classification_loss": 0.26458054780960083, + "train/contrastive_loss": 2.991323471069336, + "train/negative_loss": 2.2940022945404053, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 0.6973210573196411, + "train/total_loss": 0.862845242023468 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.30147460103034973, - "train/contrastive_loss": 2.343031883239746, - "train/negative_loss": 1.5987319946289062, + "train/classification_loss": 0.2952703535556793, + "train/contrastive_loss": 2.254122495651245, + "train/negative_loss": 2.0741899013519287, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.7442998290061951, - "train/total_loss": 0.7700809836387634 + "train/num_positives": 2, + "train/positive_loss": 0.17993269860744476, + "train/total_loss": 0.746094822883606 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.2610253691673279, - "train/contrastive_loss": 2.384575605392456, - "train/negative_loss": 2.194462776184082, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.19011281430721283, - "train/total_loss": 0.7379404902458191 + "train/classification_loss": 0.21956709027290344, + "train/contrastive_loss": 2.3346047401428223, + "train/negative_loss": 2.2797367572784424, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.05486806854605675, + "train/total_loss": 0.6864880323410034 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.22376032173633575, - "train/contrastive_loss": 2.5066978931427, - "train/negative_loss": 1.6415563821792603, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.8651414513587952, - "train/total_loss": 0.7250999212265015 + "train/classification_loss": 0.26317569613456726, + "train/contrastive_loss": 2.884903907775879, + "train/negative_loss": 2.835430860519409, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.04947293549776077, + "train/total_loss": 0.8401564359664917 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.2503180503845215, - "train/contrastive_loss": 1.669156551361084, - "train/negative_loss": 1.4470900297164917, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.2220664769411087, - "train/total_loss": 0.5841493606567383 + "train/classification_loss": 0.2982771098613739, + "train/contrastive_loss": 1.7770580053329468, + "train/negative_loss": 1.4397709369659424, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 0.337287038564682, + "train/total_loss": 0.6536887288093567 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.26975303888320923, - "train/contrastive_loss": 3.0521397590637207, - "train/negative_loss": 2.459362030029297, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.5927778482437134, - "train/total_loss": 0.8801810145378113 + "train/classification_loss": 0.2596679925918579, + "train/contrastive_loss": 5.190526485443115, + "train/negative_loss": 5.189894199371338, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.0006320484098978341, + "train/total_loss": 1.2977733612060547 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.27183014154434204, - "train/contrastive_loss": 2.8167083263397217, - "train/negative_loss": 1.6640963554382324, + "train/classification_loss": 0.2867215573787689, + "train/contrastive_loss": 1.3076599836349487, + "train/negative_loss": 1.1543831825256348, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.1526119709014893, - "train/total_loss": 0.8351718187332153 + "train/positive_loss": 0.15327675640583038, + "train/total_loss": 0.5482535362243652 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.26762473583221436, - "train/contrastive_loss": 1.2457349300384521, - "train/negative_loss": 1.2452888488769531, + "train/classification_loss": 0.27485737204551697, + "train/contrastive_loss": 2.8145785331726074, + "train/negative_loss": 2.7869348526000977, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.00044607982272282243, - "train/total_loss": 0.5167717337608337 + "train/num_positives": 8, + "train/positive_loss": 0.027643561363220215, + "train/total_loss": 0.8377730846405029 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.22885167598724365, - "train/contrastive_loss": 2.1733293533325195, - "train/negative_loss": 1.9526170492172241, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.22071237862110138, - "train/total_loss": 0.6635175943374634 + "train/classification_loss": 0.22017274796962738, + "train/contrastive_loss": 2.8017265796661377, + "train/negative_loss": 2.6876823902130127, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.11404415220022202, + "train/total_loss": 0.780518114566803 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.27020442485809326, - "train/contrastive_loss": 1.686435580253601, - "train/negative_loss": 1.6520968675613403, - "train/num_negatives": 46, + "train/classification_loss": 0.29706528782844543, + "train/contrastive_loss": 1.893568992614746, + "train/negative_loss": 1.7392206192016602, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.03433869779109955, - "train/total_loss": 0.6074915528297424 + "train/positive_loss": 0.15434837341308594, + "train/total_loss": 0.6757791042327881 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.31965991854667664, - "train/contrastive_loss": 2.7463219165802, - "train/negative_loss": 2.7463219165802, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.8689242601394653 - }, - { - "epoch": 2.2813688212927756, - "eval_exact_match_accuracy": 0.06285714285714286, - "eval_hamming_loss": 0.08862745098039215, - "eval_loss": 0.7041738629341125, - "eval_macro_f1": 0.03541215817430651, - "eval_macro_precision": 0.05754475703324808, - "eval_macro_recall": 0.02557544757033248, - "eval_micro_f1": 0.18537590113285274, - "eval_micro_precision": 0.9782608695652174, - "eval_micro_recall": 0.10238907849829351, - "eval_runtime": 2.6182, - "eval_samples_per_second": 200.516, - "eval_steps_per_second": 25.208, + "train/classification_loss": 0.29672476649284363, + "train/contrastive_loss": 2.324429988861084, + "train/negative_loss": 2.2799794673919678, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.044450610876083374, + "train/total_loss": 0.761610746383667 + }, + { + "epoch": 2.112676056338028, + "eval_exact_match_accuracy": 0.06701940035273368, + "eval_hamming_loss": 0.08942836393816786, + "eval_loss": 0.7768438458442688, + "eval_macro_f1": 0.03455368161250514, + "eval_macro_precision": 0.053708439897698204, + "eval_macro_recall": 0.025469981807155852, + "eval_micro_f1": 0.16310679611650486, + "eval_micro_precision": 0.9130434782608695, + "eval_micro_recall": 0.08955223880597014, + "eval_runtime": 2.8443, + "eval_samples_per_second": 199.346, + "eval_steps_per_second": 24.962, "step": 600 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.28290507197380066, - "train/contrastive_loss": 1.9128048419952393, - "train/negative_loss": 1.1631848812103271, - "train/num_negatives": 34, - "train/num_positives": 10, - "train/positive_loss": 0.7496199011802673, - "train/total_loss": 0.6654660701751709 + "train/classification_loss": 0.23301708698272705, + "train/contrastive_loss": 1.0185050964355469, + "train/negative_loss": 0.9255691170692444, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.0929359570145607, + "train/total_loss": 0.4367181062698364 }, { - "epoch": 2.2813688212927756, + "epoch": 2.112676056338028, "step": 600, - "train/classification_loss": 0.25435787439346313, - "train/contrastive_loss": 1.531445026397705, - "train/negative_loss": 1.0367933511734009, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.494651734828949, - "train/total_loss": 0.5606468915939331 + "train/classification_loss": 0.30060961842536926, + "train/contrastive_loss": 1.328704833984375, + "train/negative_loss": 1.2900022268295288, + "train/num_negatives": 54, + "train/num_positives": 2, + "train/positive_loss": 0.038702648133039474, + "train/total_loss": 0.5663505792617798 }, { - "epoch": 2.4714828897338403, - "grad_norm": 18.125659942626953, - "learning_rate": 1.991674277016743e-05, - "loss": 1.0761, + "epoch": 2.288732394366197, + "grad_norm": 14.132761001586914, + "learning_rate": 1.9923044397463003e-05, + "loss": 1.141, "step": 650 }, { - "epoch": 2.4714828897338403, + "epoch": 2.288732394366197, "step": 650, - "train/classification_loss": 0.2536318898200989, - "train/contrastive_loss": 1.662573218345642, - "train/negative_loss": 1.0499340295791626, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.6126391887664795, - "train/total_loss": 0.5861465334892273 + "train/classification_loss": 0.26593494415283203, + "train/contrastive_loss": 1.434600591659546, + "train/negative_loss": 1.0088177919387817, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.42578282952308655, + "train/total_loss": 0.5528550744056702 }, { - "epoch": 2.4714828897338403, + "epoch": 2.288732394366197, "step": 650, - "train/classification_loss": 0.22191952168941498, - "train/contrastive_loss": 0.876443088054657, - "train/negative_loss": 0.7585222125053406, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.1179208755493164, - "train/total_loss": 0.39720815420150757 + "train/classification_loss": 0.33469271659851074, + "train/contrastive_loss": 0.9574272632598877, + "train/negative_loss": 0.6218593716621399, + "train/num_negatives": 26, + "train/num_positives": 10, + "train/positive_loss": 0.3355679214000702, + "train/total_loss": 0.5261781811714172 }, { - "epoch": 2.661596958174905, - "grad_norm": 15.646866798400879, - "learning_rate": 1.9909132420091326e-05, - "loss": 1.1008, + "epoch": 2.464788732394366, + "grad_norm": 11.614706993103027, + "learning_rate": 1.991599718111346e-05, + "loss": 1.1276, "step": 700 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.2994653284549713, - "train/contrastive_loss": 1.525338888168335, - "train/negative_loss": 0.8201743960380554, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.7051644921302795, - "train/total_loss": 0.6045330762863159 + "train/classification_loss": 0.26160183548927307, + "train/contrastive_loss": 2.009491205215454, + "train/negative_loss": 2.0051932334899902, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.004298079758882523, + "train/total_loss": 0.6635000705718994 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.2716904282569885, - "train/contrastive_loss": 2.850911855697632, - "train/negative_loss": 1.7742928266525269, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 1.076619029045105, - "train/total_loss": 0.8418728113174438 + "train/classification_loss": 0.3489950895309448, + "train/contrastive_loss": 1.4548521041870117, + "train/negative_loss": 1.4246387481689453, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.03021341562271118, + "train/total_loss": 0.6399655342102051 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.22930456697940826, - "train/contrastive_loss": 2.164700508117676, - "train/negative_loss": 1.1694990396499634, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.9952014684677124, - "train/total_loss": 0.6622446775436401 + "train/classification_loss": 0.28580397367477417, + "train/contrastive_loss": 2.9900283813476562, + "train/negative_loss": 1.9930967092514038, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.996931791305542, + "train/total_loss": 0.8838096857070923 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.2327769249677658, - "train/contrastive_loss": 2.789598226547241, - "train/negative_loss": 2.1864607334136963, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.6031374335289001, - "train/total_loss": 0.7906966209411621 + "train/classification_loss": 0.19340381026268005, + "train/contrastive_loss": 1.8040951490402222, + "train/negative_loss": 1.3891160488128662, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.41497907042503357, + "train/total_loss": 0.554222822189331 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.25711044669151306, - "train/contrastive_loss": 2.615295886993408, - "train/negative_loss": 2.4645838737487793, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.15071196854114532, - "train/total_loss": 0.7801696062088013 + "train/classification_loss": 0.2559998333454132, + "train/contrastive_loss": 3.1747539043426514, + "train/negative_loss": 2.8927342891693115, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.2820196747779846, + "train/total_loss": 0.8909506797790527 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.25439080595970154, - "train/contrastive_loss": 2.755465030670166, - "train/negative_loss": 2.1769564151763916, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.578508734703064, - "train/total_loss": 0.8054838180541992 + "train/classification_loss": 0.26788848638534546, + "train/contrastive_loss": 2.892021656036377, + "train/negative_loss": 2.1982061862945557, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.6938154101371765, + "train/total_loss": 0.8462928533554077 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.3042704164981842, - "train/contrastive_loss": 1.728822112083435, - "train/negative_loss": 1.3971470594406128, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.33167505264282227, - "train/total_loss": 0.6500348448753357 + "train/classification_loss": 0.24627529084682465, + "train/contrastive_loss": 2.3007020950317383, + "train/negative_loss": 1.1821531057357788, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.1185489892959595, + "train/total_loss": 0.7064157128334045 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.21240699291229248, - "train/contrastive_loss": 1.6849901676177979, - "train/negative_loss": 1.2934989929199219, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.3914911448955536, - "train/total_loss": 0.549405038356781 + "train/classification_loss": 0.27907198667526245, + "train/contrastive_loss": 1.1958181858062744, + "train/negative_loss": 1.195792317390442, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 2.5868750526569784e-05, + "train/total_loss": 0.5182356238365173 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.21919921040534973, - "train/contrastive_loss": 2.044989585876465, - "train/negative_loss": 1.932242751121521, + "train/classification_loss": 0.22659878432750702, + "train/contrastive_loss": 1.5324945449829102, + "train/negative_loss": 1.1574326753616333, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.11274679750204086, - "train/total_loss": 0.6281971335411072 + "train/positive_loss": 0.37506192922592163, + "train/total_loss": 0.5330976843833923 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.31865638494491577, - "train/contrastive_loss": 4.073726177215576, - "train/negative_loss": 2.209306478500366, + "train/classification_loss": 0.2787783443927765, + "train/contrastive_loss": 2.935335874557495, + "train/negative_loss": 1.3649426698684692, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.86441969871521, - "train/total_loss": 1.13340163230896 - }, - { - "epoch": 2.661596958174905, - "step": 700, - "train/classification_loss": 0.24157316982746124, - "train/contrastive_loss": 2.4247536659240723, - "train/negative_loss": 2.0164122581481934, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.4083414077758789, - "train/total_loss": 0.7265239357948303 + "train/num_positives": 14, + "train/positive_loss": 1.5703932046890259, + "train/total_loss": 0.8658455610275269 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.2076490968465805, - "train/contrastive_loss": 1.747489333152771, - "train/negative_loss": 1.5995473861694336, - "train/num_negatives": 44, + "train/classification_loss": 0.2323508858680725, + "train/contrastive_loss": 1.201979398727417, + "train/negative_loss": 1.1058276891708374, + "train/num_negatives": 38, "train/num_positives": 12, - "train/positive_loss": 0.14794190227985382, - "train/total_loss": 0.5571469664573669 + "train/positive_loss": 0.0961516723036766, + "train/total_loss": 0.4727467894554138 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.2757457196712494, - "train/contrastive_loss": 5.1306328773498535, - "train/negative_loss": 3.2522830963134766, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.8783496618270874, - "train/total_loss": 1.3018723726272583 + "train/classification_loss": 0.26310840249061584, + "train/contrastive_loss": 1.5375195741653442, + "train/negative_loss": 1.4847670793533325, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.052752535790205, + "train/total_loss": 0.5706123113632202 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.2260957658290863, - "train/contrastive_loss": 1.8585227727890015, - "train/negative_loss": 1.856015920639038, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.0025068209506571293, - "train/total_loss": 0.5978003144264221 + "train/classification_loss": 0.26589787006378174, + "train/contrastive_loss": 5.935999870300293, + "train/negative_loss": 3.2628040313720703, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 2.6731958389282227, + "train/total_loss": 1.4530978202819824 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.2045612633228302, - "train/contrastive_loss": 1.9165334701538086, - "train/negative_loss": 1.7333019971847534, + "train/classification_loss": 0.29565703868865967, + "train/contrastive_loss": 1.8856391906738281, + "train/negative_loss": 1.7572426795959473, "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.18323147296905518, - "train/total_loss": 0.5878679752349854 + "train/num_positives": 4, + "train/positive_loss": 0.12839657068252563, + "train/total_loss": 0.6727849245071411 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.2293652445077896, - "train/contrastive_loss": 1.1107189655303955, - "train/negative_loss": 0.9884741902351379, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.12224483489990234, - "train/total_loss": 0.4515090584754944 + "train/classification_loss": 0.1868654489517212, + "train/contrastive_loss": 2.650007486343384, + "train/negative_loss": 1.233117938041687, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.4168895483016968, + "train/total_loss": 0.7168669700622559 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.29241329431533813, - "train/contrastive_loss": 2.552403211593628, - "train/negative_loss": 1.9390541315078735, - "train/num_negatives": 40, + "train/classification_loss": 0.2679687440395355, + "train/contrastive_loss": 2.0526623725891113, + "train/negative_loss": 1.8156697750091553, + "train/num_negatives": 38, "train/num_positives": 14, - "train/positive_loss": 0.6133490800857544, - "train/total_loss": 0.8028939366340637 + "train/positive_loss": 0.23699267208576202, + "train/total_loss": 0.6785012483596802 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.29301896691322327, - "train/contrastive_loss": 1.6143419742584229, - "train/negative_loss": 1.2226470708847046, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.39169493317604065, - "train/total_loss": 0.6158874034881592 + "train/classification_loss": 0.2409229278564453, + "train/contrastive_loss": 2.007019519805908, + "train/negative_loss": 1.8985358476638794, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.10848365724086761, + "train/total_loss": 0.642326831817627 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.2892492115497589, - "train/contrastive_loss": 1.7139005661010742, - "train/negative_loss": 1.6992182731628418, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.014682238921523094, - "train/total_loss": 0.6320292949676514 + "train/classification_loss": 0.25849634408950806, + "train/contrastive_loss": 1.664421796798706, + "train/negative_loss": 1.496127724647522, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.1682940572500229, + "train/total_loss": 0.5913807153701782 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.22525863349437714, - "train/contrastive_loss": 2.7267684936523438, - "train/negative_loss": 2.2744290828704834, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.4523395299911499, - "train/total_loss": 0.770612359046936 + "train/classification_loss": 0.28674477338790894, + "train/contrastive_loss": 2.489363670349121, + "train/negative_loss": 2.305185556411743, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.18417812883853912, + "train/total_loss": 0.78461754322052 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.2927425503730774, - "train/contrastive_loss": 3.7027173042297363, - "train/negative_loss": 1.7385168075561523, - "train/num_negatives": 44, + "train/classification_loss": 0.22376161813735962, + "train/contrastive_loss": 2.142667770385742, + "train/negative_loss": 1.9347009658813477, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.20796677470207214, + "train/total_loss": 0.6522951722145081 + }, + { + "epoch": 2.464788732394366, + "step": 700, + "train/classification_loss": 0.21757212281227112, + "train/contrastive_loss": 1.4172059297561646, + "train/negative_loss": 1.3893778324127197, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.9642006158828735, - "train/total_loss": 1.0332860946655273 + "train/positive_loss": 0.02782805822789669, + "train/total_loss": 0.5010132789611816 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.3071487247943878, - "train/contrastive_loss": 2.059997320175171, - "train/negative_loss": 1.9074153900146484, - "train/num_negatives": 44, + "train/classification_loss": 0.1990765482187271, + "train/contrastive_loss": 2.7547669410705566, + "train/negative_loss": 2.121692180633545, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.15258201956748962, - "train/total_loss": 0.7191481590270996 + "train/positive_loss": 0.6330747604370117, + "train/total_loss": 0.7500299215316772 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.21001872420310974, - "train/contrastive_loss": 1.017821192741394, - "train/negative_loss": 0.868910014629364, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.14891116321086884, - "train/total_loss": 0.413582980632782 + "train/classification_loss": 0.26614558696746826, + "train/contrastive_loss": 1.6581043004989624, + "train/negative_loss": 1.2447292804718018, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.41337499022483826, + "train/total_loss": 0.5977664589881897 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.20443391799926758, - "train/contrastive_loss": 1.5647622346878052, - "train/negative_loss": 0.8424947261810303, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.7222675085067749, - "train/total_loss": 0.5173863768577576 + "train/classification_loss": 0.2881677448749542, + "train/contrastive_loss": 3.0211892127990723, + "train/negative_loss": 1.4713469743728638, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.549842357635498, + "train/total_loss": 0.89240562915802 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.1837853044271469, - "train/contrastive_loss": 1.7038711309432983, - "train/negative_loss": 1.6445629596710205, + "train/classification_loss": 0.26242172718048096, + "train/contrastive_loss": 1.866014003753662, + "train/negative_loss": 1.0343221426010132, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.05930814519524574, - "train/total_loss": 0.5245595574378967 + "train/num_positives": 10, + "train/positive_loss": 0.8316918611526489, + "train/total_loss": 0.6356245279312134 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.29376256465911865, - "train/contrastive_loss": 1.1775813102722168, - "train/negative_loss": 0.248218834400177, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 0.9293625354766846, - "train/total_loss": 0.5292788147926331 + "train/classification_loss": 0.25315940380096436, + "train/contrastive_loss": 3.169330596923828, + "train/negative_loss": 2.0961296558380127, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.0732009410858154, + "train/total_loss": 0.8870255351066589 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.2838677167892456, - "train/contrastive_loss": 1.9853549003601074, - "train/negative_loss": 1.9708870649337769, + "train/classification_loss": 0.2769738435745239, + "train/contrastive_loss": 2.8473868370056152, + "train/negative_loss": 2.842177152633667, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.014467819593846798, - "train/total_loss": 0.680938720703125 + "train/num_positives": 4, + "train/positive_loss": 0.005209724418818951, + "train/total_loss": 0.8464512228965759 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.2653903067111969, - "train/contrastive_loss": 2.4695611000061035, - "train/negative_loss": 2.1538469791412354, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.31571418046951294, - "train/total_loss": 0.7593024969100952 + "train/classification_loss": 0.2702639102935791, + "train/contrastive_loss": 0.43696677684783936, + "train/negative_loss": 0.4276716709136963, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.009295119903981686, + "train/total_loss": 0.357657253742218 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.2679423689842224, - "train/contrastive_loss": 1.2107802629470825, - "train/negative_loss": 1.1737455129623413, - "train/num_negatives": 40, + "train/classification_loss": 0.2649320363998413, + "train/contrastive_loss": 4.0508856773376465, + "train/negative_loss": 1.8131588697433472, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.0370347835123539, - "train/total_loss": 0.5100984573364258 + "train/positive_loss": 2.237726926803589, + "train/total_loss": 1.0751092433929443 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.2834407091140747, - "train/contrastive_loss": 2.566127300262451, - "train/negative_loss": 2.115593433380127, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.4505338668823242, - "train/total_loss": 0.7966662049293518 + "train/classification_loss": 0.3046039640903473, + "train/contrastive_loss": 1.2810300588607788, + "train/negative_loss": 1.1386232376098633, + "train/num_negatives": 38, + "train/num_positives": 10, + "train/positive_loss": 0.14240680634975433, + "train/total_loss": 0.5608099699020386 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.2563798129558563, - "train/contrastive_loss": 1.9317893981933594, - "train/negative_loss": 0.9889421463012695, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.9428472518920898, - "train/total_loss": 0.6427376866340637 + "train/classification_loss": 0.21259135007858276, + "train/contrastive_loss": 1.4091565608978271, + "train/negative_loss": 1.408933401107788, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.0002231640974059701, + "train/total_loss": 0.49442267417907715 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.26408088207244873, - "train/contrastive_loss": 3.406033515930176, - "train/negative_loss": 2.6770663261413574, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.7289670705795288, - "train/total_loss": 0.9452875852584839 + "train/classification_loss": 0.2486288696527481, + "train/contrastive_loss": 4.611261367797852, + "train/negative_loss": 2.3544013500213623, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 2.2568600177764893, + "train/total_loss": 1.1708811521530151 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.3245859444141388, - "train/contrastive_loss": 1.3018834590911865, - "train/negative_loss": 1.301150918006897, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0007325112819671631, - "train/total_loss": 0.5849626064300537 + "train/classification_loss": 0.25692251324653625, + "train/contrastive_loss": 3.3561017513275146, + "train/negative_loss": 2.010610580444336, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.3454911708831787, + "train/total_loss": 0.9281429052352905 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.27598485350608826, - "train/contrastive_loss": 2.359105348587036, - "train/negative_loss": 2.032038927078247, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.32706642150878906, - "train/total_loss": 0.7478059530258179 + "train/classification_loss": 0.27464237809181213, + "train/contrastive_loss": 1.9858033657073975, + "train/negative_loss": 1.7059353590011597, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.2798679769039154, + "train/total_loss": 0.6718030571937561 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.25861242413520813, - "train/contrastive_loss": 3.1143689155578613, - "train/negative_loss": 2.5002758502960205, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.6140931844711304, - "train/total_loss": 0.881486177444458 + "train/classification_loss": 0.31064096093177795, + "train/contrastive_loss": 2.6247735023498535, + "train/negative_loss": 2.1107285022735596, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.514045000076294, + "train/total_loss": 0.8355957269668579 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.23103652894496918, - "train/contrastive_loss": 3.6791999340057373, - "train/negative_loss": 2.2417356967926025, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.4374642372131348, - "train/total_loss": 0.9668765664100647 + "train/classification_loss": 0.19985580444335938, + "train/contrastive_loss": 3.0397794246673584, + "train/negative_loss": 2.7400920391082764, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.29968732595443726, + "train/total_loss": 0.8078116774559021 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.24488118290901184, - "train/contrastive_loss": 3.0132226943969727, - "train/negative_loss": 2.4720757007598877, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.5411471128463745, - "train/total_loss": 0.8475257158279419 + "train/classification_loss": 0.27227783203125, + "train/contrastive_loss": 1.791211485862732, + "train/negative_loss": 1.4521441459655762, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 0.33906733989715576, + "train/total_loss": 0.6305201053619385 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.23817351460456848, - "train/contrastive_loss": 1.8667124509811401, - "train/negative_loss": 1.7049696445465088, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.16174279153347015, - "train/total_loss": 0.611515998840332 + "train/classification_loss": 0.3416289985179901, + "train/contrastive_loss": 3.330692768096924, + "train/negative_loss": 3.3222756385803223, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.00841722171753645, + "train/total_loss": 1.0077675580978394 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.2799569368362427, - "train/contrastive_loss": 1.3443957567214966, - "train/negative_loss": 1.340288758277893, - "train/num_negatives": 46, + "train/classification_loss": 0.26505497097969055, + "train/contrastive_loss": 0.704699695110321, + "train/negative_loss": 0.7026187777519226, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.002080937847495079, + "train/total_loss": 0.40599489212036133 + }, + { + "epoch": 2.464788732394366, + "step": 700, + "train/classification_loss": 0.29826709628105164, + "train/contrastive_loss": 4.536911964416504, + "train/negative_loss": 2.966407299041748, + "train/num_negatives": 42, "train/num_positives": 8, - "train/positive_loss": 0.004106984008103609, - "train/total_loss": 0.5488361120223999 + "train/positive_loss": 1.5705044269561768, + "train/total_loss": 1.205649495124817 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.25153419375419617, - "train/contrastive_loss": 1.8644427061080933, - "train/negative_loss": 1.8633028268814087, + "train/classification_loss": 0.20360641181468964, + "train/contrastive_loss": 1.3062645196914673, + "train/negative_loss": 1.0606977939605713, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.0011399326613172889, - "train/total_loss": 0.6244227290153503 + "train/num_positives": 10, + "train/positive_loss": 0.24556677043437958, + "train/total_loss": 0.4648593068122864 + }, + { + "epoch": 2.464788732394366, + "step": 700, + "train/classification_loss": 0.22966787219047546, + "train/contrastive_loss": 3.801238536834717, + "train/negative_loss": 2.7578775882720947, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 1.0433610677719116, + "train/total_loss": 0.9899156093597412 + }, + { + "epoch": 2.464788732394366, + "step": 700, + "train/classification_loss": 0.2880914807319641, + "train/contrastive_loss": 1.2372689247131348, + "train/negative_loss": 1.1856848001480103, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.0515841506421566, + "train/total_loss": 0.535545289516449 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.22809238731861115, - "train/contrastive_loss": 0.806515097618103, - "train/negative_loss": 0.8063143491744995, + "train/classification_loss": 0.2807157635688782, + "train/contrastive_loss": 2.0164473056793213, + "train/negative_loss": 2.014331102371216, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.00020072566985618323, - "train/total_loss": 0.38939541578292847 + "train/positive_loss": 0.0021161732729524374, + "train/total_loss": 0.6840052604675293 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.23821842670440674, - "train/contrastive_loss": 1.9262007474899292, - "train/negative_loss": 1.8183670043945312, - "train/num_negatives": 36, + "train/classification_loss": 0.27108246088027954, + "train/contrastive_loss": 1.4438271522521973, + "train/negative_loss": 1.2064590454101562, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.2373681366443634, + "train/total_loss": 0.559847891330719 + }, + { + "epoch": 2.464788732394366, + "step": 700, + "train/classification_loss": 0.33205175399780273, + "train/contrastive_loss": 2.6006836891174316, + "train/negative_loss": 2.2137322425842285, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.10783372074365616, - "train/total_loss": 0.6234586238861084 + "train/positive_loss": 0.38695135712623596, + "train/total_loss": 0.8521885275840759 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.29103705286979675, - "train/contrastive_loss": 2.0493345260620117, - "train/negative_loss": 1.5532599687576294, + "train/classification_loss": 0.23320068418979645, + "train/contrastive_loss": 2.6594433784484863, + "train/negative_loss": 1.4917128086090088, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.167730450630188, + "train/total_loss": 0.7650893330574036 + }, + { + "epoch": 2.464788732394366, + "step": 700, + "train/classification_loss": 0.2598276436328888, + "train/contrastive_loss": 1.8245913982391357, + "train/negative_loss": 1.3977611064910889, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.4960744380950928, - "train/total_loss": 0.7009039521217346 + "train/num_positives": 14, + "train/positive_loss": 0.4268302321434021, + "train/total_loss": 0.6247459650039673 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.23092569410800934, - "train/contrastive_loss": 2.2218081951141357, - "train/negative_loss": 1.9143059253692627, + "train/classification_loss": 0.2979010343551636, + "train/contrastive_loss": 2.5640647411346436, + "train/negative_loss": 2.5639495849609375, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.30750226974487305, - "train/total_loss": 0.6752873659133911 + "train/num_positives": 2, + "train/positive_loss": 0.00011516280210344121, + "train/total_loss": 0.8107140064239502 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.22102051973342896, - "train/contrastive_loss": 0.9490668177604675, - "train/negative_loss": 0.6527988314628601, + "train/classification_loss": 0.23783941566944122, + "train/contrastive_loss": 2.694197654724121, + "train/negative_loss": 1.6137291193008423, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.2962679862976074, - "train/total_loss": 0.4108338952064514 + "train/num_positives": 16, + "train/positive_loss": 1.0804685354232788, + "train/total_loss": 0.7766789197921753 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.32533833384513855, - "train/contrastive_loss": 2.0928139686584473, - "train/negative_loss": 1.8137067556381226, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.27910709381103516, - "train/total_loss": 0.7439011335372925 + "train/classification_loss": 0.2812771201133728, + "train/contrastive_loss": 2.404744863510132, + "train/negative_loss": 2.1674630641937256, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.23728182911872864, + "train/total_loss": 0.7622261047363281 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.20622886717319489, - "train/contrastive_loss": 1.5176365375518799, - "train/negative_loss": 1.5175575017929077, - "train/num_negatives": 48, + "train/classification_loss": 0.2981731593608856, + "train/contrastive_loss": 0.9076513051986694, + "train/negative_loss": 0.8752302527427673, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 7.906969403848052e-05, - "train/total_loss": 0.5097562074661255 + "train/positive_loss": 0.03242107480764389, + "train/total_loss": 0.479703426361084 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.24132312834262848, - "train/contrastive_loss": 0.37347301840782166, - "train/negative_loss": 0.3601992428302765, + "train/classification_loss": 0.26617908477783203, + "train/contrastive_loss": 1.1268925666809082, + "train/negative_loss": 0.8994209170341492, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.013273782096803188, - "train/total_loss": 0.316017746925354 + "train/num_positives": 14, + "train/positive_loss": 0.22747159004211426, + "train/total_loss": 0.49155759811401367 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.21682921051979065, - "train/contrastive_loss": 1.019074559211731, - "train/negative_loss": 1.008063554763794, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.011011029593646526, - "train/total_loss": 0.4206441044807434 + "train/classification_loss": 0.34852468967437744, + "train/contrastive_loss": 2.451164722442627, + "train/negative_loss": 2.0943233966827393, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 0.3568412661552429, + "train/total_loss": 0.8387576341629028 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.29464709758758545, - "train/contrastive_loss": 0.6986509561538696, - "train/negative_loss": 0.3485206067562103, - "train/num_negatives": 28, + "train/classification_loss": 0.21351921558380127, + "train/contrastive_loss": 1.3077449798583984, + "train/negative_loss": 1.2763208150863647, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.3501303195953369, - "train/total_loss": 0.4343773126602173 + "train/positive_loss": 0.03142421320080757, + "train/total_loss": 0.47506821155548096 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.258434534072876, - "train/contrastive_loss": 2.3623549938201904, - "train/negative_loss": 2.0024938583374023, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.35986122488975525, - "train/total_loss": 0.7309055328369141 + "train/classification_loss": 0.22098085284233093, + "train/contrastive_loss": 1.252382755279541, + "train/negative_loss": 0.9320904612541199, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.32029226422309875, + "train/total_loss": 0.47145742177963257 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.23046980798244476, - "train/contrastive_loss": 1.1544729471206665, - "train/negative_loss": 1.1530126333236694, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.0014603384770452976, - "train/total_loss": 0.46136438846588135 + "train/classification_loss": 0.24900402128696442, + "train/contrastive_loss": 1.5956631898880005, + "train/negative_loss": 1.4973597526550293, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.09830348938703537, + "train/total_loss": 0.5681366920471191 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.24745330214500427, - "train/contrastive_loss": 2.3149478435516357, - "train/negative_loss": 1.0244983434677124, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.2904495000839233, - "train/total_loss": 0.7104429006576538 + "train/classification_loss": 0.2717909514904022, + "train/contrastive_loss": 3.126350164413452, + "train/negative_loss": 2.1042404174804688, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.0221097469329834, + "train/total_loss": 0.8970609903335571 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.2671908736228943, - "train/contrastive_loss": 4.058802604675293, - "train/negative_loss": 3.243508815765381, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.8152940273284912, - "train/total_loss": 1.078951358795166 + "train/classification_loss": 0.27638933062553406, + "train/contrastive_loss": 2.0312418937683105, + "train/negative_loss": 1.7461339235305786, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.2851078510284424, + "train/total_loss": 0.6826376914978027 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.25356361269950867, - "train/contrastive_loss": 1.608991026878357, - "train/negative_loss": 0.7582995295524597, + "train/classification_loss": 0.22918930649757385, + "train/contrastive_loss": 0.6197246313095093, + "train/negative_loss": 0.5883871912956238, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.8506914973258972, - "train/total_loss": 0.5753618478775024 + "train/num_positives": 16, + "train/positive_loss": 0.03133746609091759, + "train/total_loss": 0.35313424468040466 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.22574490308761597, - "train/contrastive_loss": 3.8971784114837646, - "train/negative_loss": 2.6883766651153564, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.2088017463684082, - "train/total_loss": 1.0051805973052979 + "train/classification_loss": 0.25562724471092224, + "train/contrastive_loss": 2.7033188343048096, + "train/negative_loss": 1.738297700881958, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 0.9650211334228516, + "train/total_loss": 0.7962909936904907 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.29417672753334045, - "train/contrastive_loss": 3.1986939907073975, - "train/negative_loss": 1.8751858472824097, + "train/classification_loss": 0.2959875464439392, + "train/contrastive_loss": 2.5730886459350586, + "train/negative_loss": 2.090815544128418, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.3235081434249878, - "train/total_loss": 0.9339154958724976 + "train/num_positives": 2, + "train/positive_loss": 0.4822732210159302, + "train/total_loss": 0.8106052875518799 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.2525008022785187, - "train/contrastive_loss": 2.3908090591430664, - "train/negative_loss": 2.372826337814331, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.017982831224799156, - "train/total_loss": 0.7306625843048096 + "train/classification_loss": 0.20701751112937927, + "train/contrastive_loss": 2.353665351867676, + "train/negative_loss": 1.7266006469726562, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.62706458568573, + "train/total_loss": 0.6777505874633789 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.21399809420108795, - "train/contrastive_loss": 2.346482515335083, - "train/negative_loss": 1.5640166997909546, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.7824658751487732, - "train/total_loss": 0.6832945942878723 + "train/classification_loss": 0.2567755877971649, + "train/contrastive_loss": 2.0725317001342773, + "train/negative_loss": 1.6104071140289307, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.46212470531463623, + "train/total_loss": 0.6712819337844849 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.23734401166439056, - "train/contrastive_loss": 2.165987491607666, - "train/negative_loss": 1.6359527111053467, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.5300347208976746, - "train/total_loss": 0.670541524887085 + "train/classification_loss": 0.2919117510318756, + "train/contrastive_loss": 2.773078680038452, + "train/negative_loss": 1.5652027130126953, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 1.2078759670257568, + "train/total_loss": 0.8465274572372437 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.26203396916389465, - "train/contrastive_loss": 4.567227363586426, - "train/negative_loss": 3.838006019592285, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.729221522808075, - "train/total_loss": 1.1754794120788574 + "train/classification_loss": 0.24964767694473267, + "train/contrastive_loss": 4.710105895996094, + "train/negative_loss": 4.71002721786499, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 7.888646359788254e-05, + "train/total_loss": 1.1916688680648804 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.26599910855293274, - "train/contrastive_loss": 3.8680429458618164, - "train/negative_loss": 2.356389045715332, + "train/classification_loss": 0.279945969581604, + "train/contrastive_loss": 1.2637437582015991, + "train/negative_loss": 1.243511438369751, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.5116537809371948, - "train/total_loss": 1.0396077632904053 + "train/positive_loss": 0.020232265815138817, + "train/total_loss": 0.5326946973800659 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.25672394037246704, - "train/contrastive_loss": 0.672511100769043, - "train/negative_loss": 0.6421878337860107, + "train/classification_loss": 0.26825597882270813, + "train/contrastive_loss": 2.8947269916534424, + "train/negative_loss": 2.7786574363708496, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.03032328188419342, - "train/total_loss": 0.3912261724472046 + "train/num_positives": 8, + "train/positive_loss": 0.11606947332620621, + "train/total_loss": 0.8472013473510742 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.217296302318573, - "train/contrastive_loss": 2.443679094314575, - "train/negative_loss": 2.2321937084198, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.2114853709936142, - "train/total_loss": 0.7060321569442749 + "train/classification_loss": 0.21056686341762543, + "train/contrastive_loss": 1.890453815460205, + "train/negative_loss": 1.755068063735962, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.13538573682308197, + "train/total_loss": 0.5886576175689697 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.2646985352039337, - "train/contrastive_loss": 1.5904335975646973, - "train/negative_loss": 1.5195107460021973, - "train/num_negatives": 46, + "train/classification_loss": 0.2907728850841522, + "train/contrastive_loss": 1.5807266235351562, + "train/negative_loss": 1.4380918741226196, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.0709228590130806, - "train/total_loss": 0.5827852487564087 + "train/positive_loss": 0.1426348090171814, + "train/total_loss": 0.606918215751648 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.31466665863990784, - "train/contrastive_loss": 2.216660976409912, - "train/negative_loss": 2.216660976409912, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.7579988241195679 - }, - { - "epoch": 2.661596958174905, - "eval_exact_match_accuracy": 0.08, - "eval_hamming_loss": 0.0869467787114846, - "eval_loss": 0.694094717502594, - "eval_macro_f1": 0.03994190268700073, - "eval_macro_precision": 0.05530417295123177, - "eval_macro_recall": 0.0312588803637397, - "eval_micro_f1": 0.22088353413654618, - "eval_micro_precision": 0.9401709401709402, - "eval_micro_recall": 0.12514220705346984, - "eval_runtime": 2.6231, - "eval_samples_per_second": 200.146, - "eval_steps_per_second": 25.161, + "train/classification_loss": 0.29031291604042053, + "train/contrastive_loss": 1.907941460609436, + "train/negative_loss": 1.5485501289367676, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.35939133167266846, + "train/total_loss": 0.6719012260437012 + }, + { + "epoch": 2.464788732394366, + "eval_exact_match_accuracy": 0.08641975308641975, + "eval_hamming_loss": 0.08828716671853927, + "eval_loss": 0.7173317670822144, + "eval_macro_f1": 0.03832151753209427, + "eval_macro_precision": 0.052056220718375845, + "eval_macro_recall": 0.030321406913280773, + "eval_micro_f1": 0.19029495718363462, + "eval_micro_precision": 0.8849557522123894, + "eval_micro_recall": 0.10660980810234541, + "eval_runtime": 2.8445, + "eval_samples_per_second": 199.329, + "eval_steps_per_second": 24.96, "step": 700 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.234074205160141, - "train/contrastive_loss": 1.146761417388916, - "train/negative_loss": 0.8328234553337097, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.3139380216598511, - "train/total_loss": 0.46342647075653076 + "train/classification_loss": 0.2534940540790558, + "train/contrastive_loss": 1.2565116882324219, + "train/negative_loss": 1.11784827709198, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.1386633664369583, + "train/total_loss": 0.5047963857650757 }, { - "epoch": 2.661596958174905, + "epoch": 2.464788732394366, "step": 700, - "train/classification_loss": 0.21601387858390808, - "train/contrastive_loss": 1.5864155292510986, - "train/negative_loss": 1.1961942911148071, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.3902212679386139, - "train/total_loss": 0.5332970023155212 + "train/classification_loss": 0.17683963477611542, + "train/contrastive_loss": 1.7005207538604736, + "train/negative_loss": 1.2565371990203857, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.4439835548400879, + "train/total_loss": 0.5169438123703003 }, { - "epoch": 2.8517110266159698, - "grad_norm": 10.527934074401855, - "learning_rate": 1.990152207001522e-05, - "loss": 1.0576, + "epoch": 2.640845070422535, + "grad_norm": 12.585654258728027, + "learning_rate": 1.990894996476392e-05, + "loss": 1.07, "step": 750 }, { - "epoch": 2.8517110266159698, + "epoch": 2.640845070422535, "step": 750, - "train/classification_loss": 0.24150267243385315, - "train/contrastive_loss": 1.3705381155014038, - "train/negative_loss": 0.967003583908081, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.40353450179100037, - "train/total_loss": 0.5156103372573853 + "train/classification_loss": 0.2328159660100937, + "train/contrastive_loss": 1.05596923828125, + "train/negative_loss": 0.9213714599609375, + "train/num_negatives": 38, + "train/num_positives": 10, + "train/positive_loss": 0.1345977932214737, + "train/total_loss": 0.44400981068611145 }, { - "epoch": 2.8517110266159698, + "epoch": 2.640845070422535, "step": 750, - "train/classification_loss": 0.2635066509246826, - "train/contrastive_loss": 0.9432570934295654, - "train/negative_loss": 0.8198953866958618, - "train/num_negatives": 14, - "train/num_positives": 28, - "train/positive_loss": 0.12336168438196182, - "train/total_loss": 0.4521580934524536 + "train/classification_loss": 0.2837826907634735, + "train/contrastive_loss": 1.1195340156555176, + "train/negative_loss": 1.021483063697815, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.09805101156234741, + "train/total_loss": 0.5076894760131836 }, { - "epoch": 3.041825095057034, - "grad_norm": 11.493776321411133, - "learning_rate": 1.989391171993912e-05, - "loss": 1.0646, + "epoch": 2.816901408450704, + "grad_norm": 16.904903411865234, + "learning_rate": 1.990190274841438e-05, + "loss": 1.1083, "step": 800 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.29314079880714417, - "train/contrastive_loss": 2.383169651031494, - "train/negative_loss": 0.805569589138031, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.577600121498108, - "train/total_loss": 0.7697747349739075 + "train/classification_loss": 0.25530996918678284, + "train/contrastive_loss": 2.436138153076172, + "train/negative_loss": 2.422919750213623, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.013218455947935581, + "train/total_loss": 0.7425376176834106 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.2656731903553009, - "train/contrastive_loss": 2.591348171234131, - "train/negative_loss": 1.4698973894119263, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 1.1214507818222046, - "train/total_loss": 0.7839428186416626 + "train/classification_loss": 0.3374779522418976, + "train/contrastive_loss": 1.0352551937103271, + "train/negative_loss": 1.0000343322753906, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.03522083908319473, + "train/total_loss": 0.5445289611816406 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.22482506930828094, - "train/contrastive_loss": 2.3044028282165527, - "train/negative_loss": 1.134595513343811, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.1698074340820312, - "train/total_loss": 0.6857056617736816 + "train/classification_loss": 0.28194302320480347, + "train/contrastive_loss": 2.598475456237793, + "train/negative_loss": 1.653485655784607, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.9449899196624756, + "train/total_loss": 0.801638126373291 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.22757911682128906, - "train/contrastive_loss": 3.369941234588623, - "train/negative_loss": 2.4030258655548096, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.9669153690338135, - "train/total_loss": 0.9015673995018005 + "train/classification_loss": 0.18934272229671478, + "train/contrastive_loss": 1.750364065170288, + "train/negative_loss": 1.53482186794281, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.21554219722747803, + "train/total_loss": 0.5394155383110046 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.246128648519516, - "train/contrastive_loss": 1.7975577116012573, - "train/negative_loss": 1.399200201034546, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.3983575105667114, - "train/total_loss": 0.605640172958374 + "train/classification_loss": 0.25565478205680847, + "train/contrastive_loss": 3.2658021450042725, + "train/negative_loss": 2.750257730484009, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.5155444741249084, + "train/total_loss": 0.9088152647018433 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.24048179388046265, - "train/contrastive_loss": 1.7777180671691895, - "train/negative_loss": 1.4796899557113647, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.29802805185317993, - "train/total_loss": 0.5960254073143005 + "train/classification_loss": 0.26185911893844604, + "train/contrastive_loss": 2.891963005065918, + "train/negative_loss": 2.178420305252075, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.7135428190231323, + "train/total_loss": 0.8402517437934875 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.2954685389995575, - "train/contrastive_loss": 1.4352374076843262, - "train/negative_loss": 1.2044974565505981, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.23073995113372803, - "train/total_loss": 0.5825160145759583 + "train/classification_loss": 0.24465319514274597, + "train/contrastive_loss": 2.005976915359497, + "train/negative_loss": 1.4147852659225464, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.5911916494369507, + "train/total_loss": 0.6458485722541809 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.20385415852069855, - "train/contrastive_loss": 1.6039866209030151, - "train/negative_loss": 1.1961826086044312, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.4078039824962616, - "train/total_loss": 0.5246514678001404 + "train/classification_loss": 0.2738387882709503, + "train/contrastive_loss": 1.1176095008850098, + "train/negative_loss": 1.1175786256790161, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 3.087568256887607e-05, + "train/total_loss": 0.4973607063293457 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.2125495821237564, - "train/contrastive_loss": 1.6281113624572754, - "train/negative_loss": 1.4874811172485352, + "train/classification_loss": 0.21923665702342987, + "train/contrastive_loss": 1.5575358867645264, + "train/negative_loss": 1.2310187816619873, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.14063027501106262, - "train/total_loss": 0.5381718873977661 + "train/positive_loss": 0.32651710510253906, + "train/total_loss": 0.5307438373565674 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.3155806064605713, - "train/contrastive_loss": 3.361018657684326, - "train/negative_loss": 2.1817634105682373, + "train/classification_loss": 0.27326807379722595, + "train/contrastive_loss": 3.082857131958008, + "train/negative_loss": 1.7860063314437866, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.1792552471160889, - "train/total_loss": 0.9877843260765076 - }, - { - "epoch": 3.041825095057034, - "step": 800, - "train/classification_loss": 0.23360858857631683, - "train/contrastive_loss": 1.70940101146698, - "train/negative_loss": 1.3597558736801147, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.3496451675891876, - "train/total_loss": 0.575488805770874 + "train/num_positives": 14, + "train/positive_loss": 1.2968506813049316, + "train/total_loss": 0.8898395299911499 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.19763028621673584, - "train/contrastive_loss": 1.5345540046691895, - "train/negative_loss": 1.0616207122802734, - "train/num_negatives": 44, + "train/classification_loss": 0.22566792368888855, + "train/contrastive_loss": 1.2392702102661133, + "train/negative_loss": 1.046807050704956, + "train/num_negatives": 38, "train/num_positives": 12, - "train/positive_loss": 0.472933292388916, - "train/total_loss": 0.5045410990715027 + "train/positive_loss": 0.19246315956115723, + "train/total_loss": 0.4735219478607178 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.2667146921157837, - "train/contrastive_loss": 3.7035183906555176, - "train/negative_loss": 2.3754942417144775, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.3280240297317505, - "train/total_loss": 1.0074183940887451 + "train/classification_loss": 0.2538541853427887, + "train/contrastive_loss": 1.246451735496521, + "train/negative_loss": 1.2069483995437622, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.03950328752398491, + "train/total_loss": 0.5031445026397705 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.21415624022483826, - "train/contrastive_loss": 1.3674054145812988, - "train/negative_loss": 1.3668683767318726, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.0005370261496864259, - "train/total_loss": 0.48763734102249146 + "train/classification_loss": 0.25708866119384766, + "train/contrastive_loss": 4.670703887939453, + "train/negative_loss": 3.3335177898406982, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.3371858596801758, + "train/total_loss": 1.1912294626235962 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.197384774684906, - "train/contrastive_loss": 1.4736162424087524, - "train/negative_loss": 1.2754184007644653, + "train/classification_loss": 0.29008904099464417, + "train/contrastive_loss": 2.7323391437530518, + "train/negative_loss": 2.552006244659424, "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.1981978714466095, - "train/total_loss": 0.492108017206192 + "train/num_positives": 4, + "train/positive_loss": 0.1803329586982727, + "train/total_loss": 0.8365569114685059 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.2141173779964447, - "train/contrastive_loss": 0.9334440231323242, - "train/negative_loss": 0.8736681342124939, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.059775885194540024, - "train/total_loss": 0.400806188583374 + "train/classification_loss": 0.18288853764533997, + "train/contrastive_loss": 2.640139579772949, + "train/negative_loss": 1.3435602188110352, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.296579360961914, + "train/total_loss": 0.7109165191650391 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.27988478541374207, - "train/contrastive_loss": 2.3908724784851074, - "train/negative_loss": 2.0412967205047607, - "train/num_negatives": 40, + "train/classification_loss": 0.25801247358322144, + "train/contrastive_loss": 2.0654172897338867, + "train/negative_loss": 1.4576373100280762, + "train/num_negatives": 38, "train/num_positives": 14, - "train/positive_loss": 0.34957581758499146, - "train/total_loss": 0.7580592632293701 + "train/positive_loss": 0.6077799201011658, + "train/total_loss": 0.6710959672927856 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.2827722430229187, - "train/contrastive_loss": 1.3552918434143066, - "train/negative_loss": 0.7655489444732666, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.5897429585456848, - "train/total_loss": 0.553830623626709 + "train/classification_loss": 0.2303646057844162, + "train/contrastive_loss": 1.7863417863845825, + "train/negative_loss": 1.3515750169754028, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.4347667992115021, + "train/total_loss": 0.587632954120636 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.27720171213150024, - "train/contrastive_loss": 1.2963272333145142, - "train/negative_loss": 1.293222188949585, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.003105047158896923, - "train/total_loss": 0.5364671945571899 + "train/classification_loss": 0.24760179221630096, + "train/contrastive_loss": 2.480180263519287, + "train/negative_loss": 2.380378484725952, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.09980181604623795, + "train/total_loss": 0.7436378598213196 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.21916240453720093, - "train/contrastive_loss": 2.5268235206604004, - "train/negative_loss": 1.8513298034667969, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.6754936575889587, - "train/total_loss": 0.72452712059021 + "train/classification_loss": 0.27540767192840576, + "train/contrastive_loss": 2.197237253189087, + "train/negative_loss": 2.103907346725464, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.093330018222332, + "train/total_loss": 0.7148551344871521 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.2867974042892456, - "train/contrastive_loss": 2.719491481781006, - "train/negative_loss": 1.2099329233169556, - "train/num_negatives": 44, + "train/classification_loss": 0.21698682010173798, + "train/contrastive_loss": 3.030367612838745, + "train/negative_loss": 2.7388713359832764, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.29149627685546875, + "train/total_loss": 0.8230603933334351 + }, + { + "epoch": 2.816901408450704, + "step": 800, + "train/classification_loss": 0.21215276420116425, + "train/contrastive_loss": 1.6111845970153809, + "train/negative_loss": 1.593361258506775, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.5095586776733398, - "train/total_loss": 0.8306956887245178 + "train/positive_loss": 0.017823360860347748, + "train/total_loss": 0.5343896746635437 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.3019503653049469, - "train/contrastive_loss": 1.7880195379257202, - "train/negative_loss": 1.5809377431869507, - "train/num_negatives": 44, + "train/classification_loss": 0.19150559604167938, + "train/contrastive_loss": 2.1677191257476807, + "train/negative_loss": 2.014702796936035, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.20708177983760834, - "train/total_loss": 0.6595542430877686 + "train/positive_loss": 0.15301623940467834, + "train/total_loss": 0.6250494122505188 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.20283930003643036, - "train/contrastive_loss": 0.5293982625007629, - "train/negative_loss": 0.3605397045612335, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.16885855793952942, - "train/total_loss": 0.3087189495563507 + "train/classification_loss": 0.2543528079986572, + "train/contrastive_loss": 1.461971640586853, + "train/negative_loss": 1.1034489870071411, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.3585226535797119, + "train/total_loss": 0.5467471480369568 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.19196805357933044, - "train/contrastive_loss": 1.1378841400146484, - "train/negative_loss": 0.44153982400894165, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.6963443756103516, - "train/total_loss": 0.41954487562179565 + "train/classification_loss": 0.28685474395751953, + "train/contrastive_loss": 2.5784759521484375, + "train/negative_loss": 1.704355239868164, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.8741205930709839, + "train/total_loss": 0.8025499582290649 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.17623770236968994, - "train/contrastive_loss": 1.7271051406860352, - "train/negative_loss": 1.631600022315979, + "train/classification_loss": 0.25493335723876953, + "train/contrastive_loss": 2.051750421524048, + "train/negative_loss": 1.2813271284103394, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.09550506621599197, - "train/total_loss": 0.5216587781906128 + "train/num_positives": 10, + "train/positive_loss": 0.7704232931137085, + "train/total_loss": 0.6652834415435791 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.28964459896087646, - "train/contrastive_loss": 1.2389191389083862, - "train/negative_loss": 0.31056642532348633, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 0.9283527135848999, - "train/total_loss": 0.5374284386634827 + "train/classification_loss": 0.24819374084472656, + "train/contrastive_loss": 1.961195945739746, + "train/negative_loss": 1.8431615829467773, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.11803442239761353, + "train/total_loss": 0.6404329538345337 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.276525616645813, - "train/contrastive_loss": 1.9517097473144531, - "train/negative_loss": 1.579936146736145, + "train/classification_loss": 0.2704271674156189, + "train/contrastive_loss": 2.840777635574341, + "train/negative_loss": 2.760887622833252, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.3717735707759857, - "train/total_loss": 0.6668676137924194 + "train/num_positives": 4, + "train/positive_loss": 0.07989010959863663, + "train/total_loss": 0.8385826945304871 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.25884830951690674, - "train/contrastive_loss": 1.5889256000518799, - "train/negative_loss": 1.3588613271713257, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.23006421327590942, - "train/total_loss": 0.5766334533691406 + "train/classification_loss": 0.26017406582832336, + "train/contrastive_loss": 0.879958987236023, + "train/negative_loss": 0.8019862771034241, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.07797269523143768, + "train/total_loss": 0.43616586923599243 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.2580476999282837, - "train/contrastive_loss": 0.7779901027679443, - "train/negative_loss": 0.7621481418609619, - "train/num_negatives": 40, + "train/classification_loss": 0.26372599601745605, + "train/contrastive_loss": 3.3286662101745605, + "train/negative_loss": 2.2956743240356445, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.01584198884665966, - "train/total_loss": 0.41364574432373047 + "train/positive_loss": 1.0329917669296265, + "train/total_loss": 0.929459273815155 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.2733430862426758, - "train/contrastive_loss": 3.6050033569335938, - "train/negative_loss": 2.8822522163391113, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.722751259803772, - "train/total_loss": 0.9943437576293945 + "train/classification_loss": 0.2945454716682434, + "train/contrastive_loss": 1.7435551881790161, + "train/negative_loss": 1.708172082901001, + "train/num_negatives": 38, + "train/num_positives": 10, + "train/positive_loss": 0.03538309410214424, + "train/total_loss": 0.6432565450668335 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.24679383635520935, - "train/contrastive_loss": 1.8601853847503662, - "train/negative_loss": 1.0215765237808228, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.8386088013648987, - "train/total_loss": 0.6188309192657471 + "train/classification_loss": 0.2104320377111435, + "train/contrastive_loss": 1.5684928894042969, + "train/negative_loss": 1.5593011379241943, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.009191783145070076, + "train/total_loss": 0.524130642414093 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.2583808898925781, - "train/contrastive_loss": 2.4103784561157227, - "train/negative_loss": 1.5457758903503418, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.8646025657653809, - "train/total_loss": 0.7404565811157227 + "train/classification_loss": 0.23950229585170746, + "train/contrastive_loss": 3.3051068782806396, + "train/negative_loss": 2.5042731761932373, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.8008337020874023, + "train/total_loss": 0.9005237221717834 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.31191787123680115, - "train/contrastive_loss": 1.0270315408706665, - "train/negative_loss": 1.0257138013839722, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.001317713176831603, - "train/total_loss": 0.5173242092132568 + "train/classification_loss": 0.24864685535430908, + "train/contrastive_loss": 2.874927520751953, + "train/negative_loss": 1.861314296722412, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.013613224029541, + "train/total_loss": 0.8236323595046997 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.26750773191452026, - "train/contrastive_loss": 1.855283260345459, - "train/negative_loss": 1.4683990478515625, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.3868842124938965, - "train/total_loss": 0.6385643482208252 + "train/classification_loss": 0.26860445737838745, + "train/contrastive_loss": 2.1972618103027344, + "train/negative_loss": 2.1391520500183105, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.05810968205332756, + "train/total_loss": 0.7080568075180054 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.2496001273393631, - "train/contrastive_loss": 2.747602939605713, - "train/negative_loss": 2.24941349029541, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.49818935990333557, - "train/total_loss": 0.7991207242012024 + "train/classification_loss": 0.2958243787288666, + "train/contrastive_loss": 2.8103344440460205, + "train/negative_loss": 2.4228763580322266, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.38745805621147156, + "train/total_loss": 0.857891321182251 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.21907085180282593, - "train/contrastive_loss": 3.1493043899536133, - "train/negative_loss": 1.6070890426635742, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.5422152280807495, - "train/total_loss": 0.8489317297935486 + "train/classification_loss": 0.1951732039451599, + "train/contrastive_loss": 2.352726697921753, + "train/negative_loss": 2.095808267593384, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.2569184899330139, + "train/total_loss": 0.6657185554504395 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.23483891785144806, - "train/contrastive_loss": 2.6074154376983643, - "train/negative_loss": 2.0748496055603027, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.5325658321380615, - "train/total_loss": 0.7563220262527466 + "train/classification_loss": 0.264277845621109, + "train/contrastive_loss": 1.8340411186218262, + "train/negative_loss": 1.7576637268066406, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 0.07637742906808853, + "train/total_loss": 0.6310861110687256 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.22905462980270386, - "train/contrastive_loss": 2.290233612060547, - "train/negative_loss": 1.495161533355713, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.7950721979141235, - "train/total_loss": 0.6871013641357422 + "train/classification_loss": 0.32850220799446106, + "train/contrastive_loss": 3.4041428565979004, + "train/negative_loss": 3.388155460357666, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.01598750427365303, + "train/total_loss": 1.0093307495117188 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.2736884355545044, - "train/contrastive_loss": 1.2041869163513184, - "train/negative_loss": 1.0927543640136719, - "train/num_negatives": 46, + "train/classification_loss": 0.2550434172153473, + "train/contrastive_loss": 1.6375336647033691, + "train/negative_loss": 1.6250334978103638, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.012500218115746975, + "train/total_loss": 0.5825501680374146 + }, + { + "epoch": 2.816901408450704, + "step": 800, + "train/classification_loss": 0.291134774684906, + "train/contrastive_loss": 3.782825231552124, + "train/negative_loss": 3.4734084606170654, + "train/num_negatives": 42, "train/num_positives": 8, - "train/positive_loss": 0.1114325299859047, - "train/total_loss": 0.514525830745697 + "train/positive_loss": 0.30941683053970337, + "train/total_loss": 1.0476998090744019 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.24302174150943756, - "train/contrastive_loss": 1.6195422410964966, - "train/negative_loss": 1.6141878366470337, + "train/classification_loss": 0.19983667135238647, + "train/contrastive_loss": 1.3478055000305176, + "train/negative_loss": 1.2320120334625244, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.005354348570108414, - "train/total_loss": 0.5669301748275757 + "train/num_positives": 10, + "train/positive_loss": 0.11579342186450958, + "train/total_loss": 0.46939778327941895 + }, + { + "epoch": 2.816901408450704, + "step": 800, + "train/classification_loss": 0.22298429906368256, + "train/contrastive_loss": 3.5381340980529785, + "train/negative_loss": 2.65381121635437, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.8843229413032532, + "train/total_loss": 0.9306111335754395 + }, + { + "epoch": 2.816901408450704, + "step": 800, + "train/classification_loss": 0.28030794858932495, + "train/contrastive_loss": 1.4580556154251099, + "train/negative_loss": 1.4495916366577148, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.008464016020298004, + "train/total_loss": 0.5719190835952759 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.22214101254940033, - "train/contrastive_loss": 1.2069236040115356, - "train/negative_loss": 1.0607675313949585, + "train/classification_loss": 0.27817320823669434, + "train/contrastive_loss": 1.6760679483413696, + "train/negative_loss": 1.6634886264801025, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.14615602791309357, - "train/total_loss": 0.4635257422924042 + "train/positive_loss": 0.012579305097460747, + "train/total_loss": 0.6133868098258972 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.23206402361392975, - "train/contrastive_loss": 1.6516309976577759, - "train/negative_loss": 1.5536240339279175, - "train/num_negatives": 36, + "train/classification_loss": 0.2633680999279022, + "train/contrastive_loss": 2.0351154804229736, + "train/negative_loss": 1.8000682592391968, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.23504719138145447, + "train/total_loss": 0.6703912019729614 + }, + { + "epoch": 2.816901408450704, + "step": 800, + "train/classification_loss": 0.3214731812477112, + "train/contrastive_loss": 3.6920042037963867, + "train/negative_loss": 3.0195672512054443, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.0980069637298584, - "train/total_loss": 0.5623902082443237 + "train/positive_loss": 0.6724368333816528, + "train/total_loss": 1.0598740577697754 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.28138458728790283, - "train/contrastive_loss": 1.7806702852249146, - "train/negative_loss": 1.3954497575759888, + "train/classification_loss": 0.22473084926605225, + "train/contrastive_loss": 2.4874930381774902, + "train/negative_loss": 1.979832649230957, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.507660448551178, + "train/total_loss": 0.7222294807434082 + }, + { + "epoch": 2.816901408450704, + "step": 800, + "train/classification_loss": 0.2553084194660187, + "train/contrastive_loss": 1.3869521617889404, + "train/negative_loss": 1.161912202835083, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.3852205276489258, - "train/total_loss": 0.6375186443328857 + "train/num_positives": 14, + "train/positive_loss": 0.22503989934921265, + "train/total_loss": 0.5326988697052002 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.2305234670639038, - "train/contrastive_loss": 1.9142972230911255, - "train/negative_loss": 1.5349884033203125, + "train/classification_loss": 0.2978564202785492, + "train/contrastive_loss": 2.9334352016448975, + "train/negative_loss": 2.933372974395752, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.379308819770813, - "train/total_loss": 0.6133829355239868 + "train/num_positives": 2, + "train/positive_loss": 6.210996798472479e-05, + "train/total_loss": 0.8845434188842773 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.20945322513580322, - "train/contrastive_loss": 0.9568667411804199, - "train/negative_loss": 0.6745139360427856, + "train/classification_loss": 0.23521746695041656, + "train/contrastive_loss": 2.9775519371032715, + "train/negative_loss": 2.2168920040130615, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.2823527753353119, - "train/total_loss": 0.4008265733718872 + "train/num_positives": 16, + "train/positive_loss": 0.7606600522994995, + "train/total_loss": 0.8307278752326965 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.3179333508014679, - "train/contrastive_loss": 1.602040410041809, - "train/negative_loss": 1.3344659805297852, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.2675744593143463, - "train/total_loss": 0.6383414268493652 + "train/classification_loss": 0.26708418130874634, + "train/contrastive_loss": 2.4387190341949463, + "train/negative_loss": 2.3446977138519287, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.09402133524417877, + "train/total_loss": 0.7548279762268066 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.1964346319437027, - "train/contrastive_loss": 1.3324331045150757, - "train/negative_loss": 1.331918478012085, - "train/num_negatives": 48, + "train/classification_loss": 0.29026615619659424, + "train/contrastive_loss": 0.9986672401428223, + "train/negative_loss": 0.9358220100402832, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 0.0005146160256117582, - "train/total_loss": 0.46292126178741455 + "train/positive_loss": 0.06284521520137787, + "train/total_loss": 0.48999959230422974 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.22980420291423798, - "train/contrastive_loss": 0.1973051130771637, - "train/negative_loss": 0.1444212645292282, + "train/classification_loss": 0.2614245116710663, + "train/contrastive_loss": 1.0351309776306152, + "train/negative_loss": 0.9160920977592468, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.05288384109735489, - "train/total_loss": 0.26926523447036743 + "train/num_positives": 14, + "train/positive_loss": 0.1190388947725296, + "train/total_loss": 0.46845072507858276 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.20481838285923004, - "train/contrastive_loss": 0.47898679971694946, - "train/negative_loss": 0.47255268692970276, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.006434099283069372, - "train/total_loss": 0.30061572790145874 + "train/classification_loss": 0.3408012390136719, + "train/contrastive_loss": 2.7718424797058105, + "train/negative_loss": 2.7475712299346924, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 0.02427135780453682, + "train/total_loss": 0.895169734954834 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.2864845395088196, - "train/contrastive_loss": 0.622930645942688, - "train/negative_loss": 0.29827824234962463, - "train/num_negatives": 28, + "train/classification_loss": 0.20949704945087433, + "train/contrastive_loss": 1.3126007318496704, + "train/negative_loss": 1.0364757776260376, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.32465240359306335, - "train/total_loss": 0.41107067465782166 + "train/positive_loss": 0.2761249542236328, + "train/total_loss": 0.47201722860336304 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.24819721281528473, - "train/contrastive_loss": 1.8811273574829102, - "train/negative_loss": 1.4011094570159912, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.48001784086227417, - "train/total_loss": 0.6244226694107056 + "train/classification_loss": 0.21531300246715546, + "train/contrastive_loss": 1.5455608367919922, + "train/negative_loss": 1.2875653505325317, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.25799551606178284, + "train/total_loss": 0.5244251489639282 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.22059552371501923, - "train/contrastive_loss": 1.1323555707931519, - "train/negative_loss": 1.1309107542037964, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.0014448151923716068, - "train/total_loss": 0.44706663489341736 + "train/classification_loss": 0.24157361686229706, + "train/contrastive_loss": 1.898134469985962, + "train/negative_loss": 1.511379599571228, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.3867548704147339, + "train/total_loss": 0.6212005019187927 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.23779799044132233, - "train/contrastive_loss": 1.8688530921936035, - "train/negative_loss": 1.018399715423584, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.8504534363746643, - "train/total_loss": 0.6115686297416687 + "train/classification_loss": 0.2620825171470642, + "train/contrastive_loss": 2.258037567138672, + "train/negative_loss": 1.6570624113082886, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.6009751558303833, + "train/total_loss": 0.7136900424957275 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.2630332112312317, - "train/contrastive_loss": 3.738659381866455, - "train/negative_loss": 2.6653177738189697, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.0733416080474854, - "train/total_loss": 1.0107650756835938 + "train/classification_loss": 0.2702169120311737, + "train/contrastive_loss": 3.007739305496216, + "train/negative_loss": 2.9511866569519043, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.05655274540185928, + "train/total_loss": 0.8717647790908813 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.24286679923534393, - "train/contrastive_loss": 1.403984546661377, - "train/negative_loss": 0.7279723882675171, + "train/classification_loss": 0.21575193107128143, + "train/contrastive_loss": 0.4348738491535187, + "train/negative_loss": 0.42594432830810547, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.6760120987892151, - "train/total_loss": 0.5236636996269226 + "train/num_positives": 16, + "train/positive_loss": 0.008929528295993805, + "train/total_loss": 0.302726686000824 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.21834634244441986, - "train/contrastive_loss": 4.401450157165527, - "train/negative_loss": 2.8194596767425537, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.5819905996322632, - "train/total_loss": 1.0986363887786865 + "train/classification_loss": 0.24968865513801575, + "train/contrastive_loss": 2.4363017082214355, + "train/negative_loss": 1.8530491590499878, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 0.5832524299621582, + "train/total_loss": 0.7369489669799805 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.2829046845436096, - "train/contrastive_loss": 1.88767409324646, - "train/negative_loss": 1.396070122718811, + "train/classification_loss": 0.29271823167800903, + "train/contrastive_loss": 2.594679117202759, + "train/negative_loss": 2.2339677810668945, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.49160394072532654, - "train/total_loss": 0.6604394912719727 + "train/num_positives": 2, + "train/positive_loss": 0.3607114255428314, + "train/total_loss": 0.8116540908813477 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.25014060735702515, - "train/contrastive_loss": 2.5583932399749756, - "train/negative_loss": 2.4485936164855957, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.10979965329170227, - "train/total_loss": 0.7618192434310913 + "train/classification_loss": 0.20150186121463776, + "train/contrastive_loss": 2.305906295776367, + "train/negative_loss": 1.461719036102295, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.8441872000694275, + "train/total_loss": 0.6626831293106079 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.21148306131362915, - "train/contrastive_loss": 1.9780609607696533, - "train/negative_loss": 1.211673617362976, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.7663873434066772, - "train/total_loss": 0.6070952415466309 + "train/classification_loss": 0.2527795135974884, + "train/contrastive_loss": 2.8478028774261475, + "train/negative_loss": 2.579000234603882, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.26880255341529846, + "train/total_loss": 0.8223401308059692 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.23420943319797516, - "train/contrastive_loss": 2.3123865127563477, - "train/negative_loss": 1.3051868677139282, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.0071996450424194, - "train/total_loss": 0.6966867446899414 + "train/classification_loss": 0.27862924337387085, + "train/contrastive_loss": 1.8087778091430664, + "train/negative_loss": 1.5379607677459717, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 0.2708171010017395, + "train/total_loss": 0.6403847932815552 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.2563985288143158, - "train/contrastive_loss": 3.7002785205841064, - "train/negative_loss": 3.071199417114258, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.6290791630744934, - "train/total_loss": 0.9964542388916016 + "train/classification_loss": 0.24101270735263824, + "train/contrastive_loss": 4.855133533477783, + "train/negative_loss": 4.8550944328308105, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 3.922153700841591e-05, + "train/total_loss": 1.2120394706726074 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.2633938491344452, - "train/contrastive_loss": 3.086589813232422, - "train/negative_loss": 1.7845187187194824, + "train/classification_loss": 0.2651229798793793, + "train/contrastive_loss": 1.641740083694458, + "train/negative_loss": 1.5914775133132935, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.302071213722229, - "train/total_loss": 0.8807117938995361 + "train/positive_loss": 0.05026261880993843, + "train/total_loss": 0.5934709906578064 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.24562089145183563, - "train/contrastive_loss": 0.7776539921760559, - "train/negative_loss": 0.7740696668624878, + "train/classification_loss": 0.2658005952835083, + "train/contrastive_loss": 2.2454192638397217, + "train/negative_loss": 1.7501306533813477, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.0035842983052134514, - "train/total_loss": 0.4011516869068146 + "train/num_positives": 8, + "train/positive_loss": 0.4952886998653412, + "train/total_loss": 0.7148844599723816 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.21240472793579102, - "train/contrastive_loss": 1.5633504390716553, - "train/negative_loss": 1.2499130964279175, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.3134373128414154, - "train/total_loss": 0.52507483959198 + "train/classification_loss": 0.2068278044462204, + "train/contrastive_loss": 2.4670262336730957, + "train/negative_loss": 2.3775181770324707, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.08950802683830261, + "train/total_loss": 0.7002330422401428 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.2507259249687195, - "train/contrastive_loss": 1.0289647579193115, - "train/negative_loss": 0.992626965045929, - "train/num_negatives": 46, + "train/classification_loss": 0.28742626309394836, + "train/contrastive_loss": 2.058751106262207, + "train/negative_loss": 1.9918733835220337, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.03633779287338257, - "train/total_loss": 0.45651888847351074 + "train/positive_loss": 0.0668778270483017, + "train/total_loss": 0.6991764903068542 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.3053416609764099, - "train/contrastive_loss": 2.0837440490722656, - "train/negative_loss": 2.0837440490722656, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.722090482711792 - }, - { - "epoch": 3.041825095057034, - "eval_exact_match_accuracy": 0.08, - "eval_hamming_loss": 0.08582633053221289, - "eval_loss": 0.6270034909248352, - "eval_macro_f1": 0.04236694677871149, - "eval_macro_precision": 0.055175558595531235, - "eval_macro_recall": 0.034384768400113674, - "eval_micro_f1": 0.2400793650793651, - "eval_micro_precision": 0.937984496124031, - "eval_micro_recall": 0.13765642775881684, - "eval_runtime": 2.6316, - "eval_samples_per_second": 199.496, - "eval_steps_per_second": 25.08, + "train/classification_loss": 0.2809467315673828, + "train/contrastive_loss": 2.4301342964172363, + "train/negative_loss": 2.245181083679199, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.18495316803455353, + "train/total_loss": 0.766973614692688 + }, + { + "epoch": 2.816901408450704, + "eval_exact_match_accuracy": 0.07583774250440917, + "eval_hamming_loss": 0.08828716671853927, + "eval_loss": 0.7093353271484375, + "eval_macro_f1": 0.039402468066681094, + "eval_macro_precision": 0.11255656108597284, + "eval_macro_recall": 0.02976965672190796, + "eval_micro_f1": 0.1840843720038351, + "eval_micro_precision": 0.9142857142857143, + "eval_micro_recall": 0.1023454157782516, + "eval_runtime": 2.8396, + "eval_samples_per_second": 199.677, + "eval_steps_per_second": 25.004, "step": 800 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.23720505833625793, - "train/contrastive_loss": 1.2245107889175415, - "train/negative_loss": 1.0856430530548096, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.13886773586273193, - "train/total_loss": 0.4821072220802307 + "train/classification_loss": 0.252003937959671, + "train/contrastive_loss": 1.3974590301513672, + "train/negative_loss": 0.8496163487434387, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.5478426814079285, + "train/total_loss": 0.5314957499504089 }, { - "epoch": 3.041825095057034, + "epoch": 2.816901408450704, "step": 800, - "train/classification_loss": 0.21708717942237854, - "train/contrastive_loss": 1.2170062065124512, - "train/negative_loss": 1.0375351905822754, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.1794710010290146, - "train/total_loss": 0.4604884386062622 + "train/classification_loss": 0.2942037880420685, + "train/contrastive_loss": 1.0723258256912231, + "train/negative_loss": 0.9051344990730286, + "train/num_negatives": 42, + "train/num_positives": 6, + "train/positive_loss": 0.16719137132167816, + "train/total_loss": 0.5086689591407776 }, { - "epoch": 3.2319391634980987, - "grad_norm": 15.560242652893066, - "learning_rate": 1.9886301369863014e-05, - "loss": 1.0131, + "epoch": 2.992957746478873, + "grad_norm": 9.401230812072754, + "learning_rate": 1.9894855532064835e-05, + "loss": 1.0828, "step": 850 }, { - "epoch": 3.2319391634980987, + "epoch": 2.992957746478873, "step": 850, - "train/classification_loss": 0.1870625913143158, - "train/contrastive_loss": 1.5270297527313232, - "train/negative_loss": 1.4863094091415405, - "train/num_negatives": 36, - "train/num_positives": 20, - "train/positive_loss": 0.040720295161008835, - "train/total_loss": 0.49246853590011597 + "train/classification_loss": 0.27011895179748535, + "train/contrastive_loss": 1.1434996128082275, + "train/negative_loss": 0.8881341814994812, + "train/num_negatives": 38, + "train/num_positives": 18, + "train/positive_loss": 0.2553654611110687, + "train/total_loss": 0.49881887435913086 }, { - "epoch": 3.2319391634980987, + "epoch": 2.992957746478873, "step": 850, - "train/classification_loss": 0.24762944877147675, - "train/contrastive_loss": 2.3403139114379883, - "train/negative_loss": 2.015127658843994, - "train/num_negatives": 24, - "train/num_positives": 32, - "train/positive_loss": 0.3251863121986389, - "train/total_loss": 0.7156922221183777 + "train/classification_loss": 0.2618882954120636, + "train/contrastive_loss": 0.9530047178268433, + "train/negative_loss": 0.7438822984695435, + "train/num_negatives": 40, + "train/num_positives": 8, + "train/positive_loss": 0.2091224193572998, + "train/total_loss": 0.4524892568588257 }, { - "epoch": 3.4220532319391634, - "grad_norm": 14.150642395019531, - "learning_rate": 1.9878691019786912e-05, - "loss": 1.0233, + "epoch": 3.169014084507042, + "grad_norm": 12.180469512939453, + "learning_rate": 1.9887808315715293e-05, + "loss": 1.0268, "step": 900 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.2884199619293213, - "train/contrastive_loss": 1.7027394771575928, - "train/negative_loss": 0.40594401955604553, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.2967954874038696, - "train/total_loss": 0.6289678812026978 + "train/classification_loss": 0.25358226895332336, + "train/contrastive_loss": 1.9923863410949707, + "train/negative_loss": 1.7963001728057861, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.1960861086845398, + "train/total_loss": 0.6520595550537109 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.26056575775146484, - "train/contrastive_loss": 2.1305618286132812, - "train/negative_loss": 1.454452633857727, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.6761090755462646, - "train/total_loss": 0.6866781711578369 + "train/classification_loss": 0.33721333742141724, + "train/contrastive_loss": 1.2469919919967651, + "train/negative_loss": 1.0868885517120361, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.1601034700870514, + "train/total_loss": 0.5866117477416992 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.20876652002334595, - "train/contrastive_loss": 2.6527113914489746, - "train/negative_loss": 1.0051575899124146, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.6475539207458496, - "train/total_loss": 0.7393088340759277 + "train/classification_loss": 0.2690930664539337, + "train/contrastive_loss": 2.7295455932617188, + "train/negative_loss": 1.2594517469406128, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.4700939655303955, + "train/total_loss": 0.8150022029876709 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.22139424085617065, - "train/contrastive_loss": 2.723538875579834, - "train/negative_loss": 2.0466833114624023, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.6768556237220764, - "train/total_loss": 0.7661020159721375 + "train/classification_loss": 0.18621936440467834, + "train/contrastive_loss": 1.6868665218353271, + "train/negative_loss": 1.5004374980926514, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.18642906844615936, + "train/total_loss": 0.5235927104949951 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.22995351254940033, - "train/contrastive_loss": 1.4709346294403076, - "train/negative_loss": 1.0557533502578735, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.4151812493801117, - "train/total_loss": 0.5241404175758362 + "train/classification_loss": 0.2418345808982849, + "train/contrastive_loss": 3.0100104808807373, + "train/negative_loss": 2.782055139541626, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.22795523703098297, + "train/total_loss": 0.8438366651535034 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.23638282716274261, - "train/contrastive_loss": 2.1670122146606445, - "train/negative_loss": 1.4138766527175903, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.7531355619430542, - "train/total_loss": 0.6697852611541748 + "train/classification_loss": 0.25583726167678833, + "train/contrastive_loss": 2.327380418777466, + "train/negative_loss": 1.7409801483154297, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.5864002704620361, + "train/total_loss": 0.7213133573532104 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.28841862082481384, - "train/contrastive_loss": 1.3055506944656372, - "train/negative_loss": 0.9987215399742126, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.30682915449142456, - "train/total_loss": 0.5495287775993347 + "train/classification_loss": 0.2349979132413864, + "train/contrastive_loss": 1.4303185939788818, + "train/negative_loss": 0.9587671756744385, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.47155144810676575, + "train/total_loss": 0.5210616588592529 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.19768036901950836, - "train/contrastive_loss": 1.924098253250122, - "train/negative_loss": 1.3412444591522217, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.5828537940979004, - "train/total_loss": 0.5825000405311584 + "train/classification_loss": 0.2661401629447937, + "train/contrastive_loss": 0.7526309490203857, + "train/negative_loss": 0.7526141405105591, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 1.6808651707833633e-05, + "train/total_loss": 0.4166663587093353 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.20158839225769043, - "train/contrastive_loss": 1.7283940315246582, - "train/negative_loss": 1.4879553318023682, + "train/classification_loss": 0.20879028737545013, + "train/contrastive_loss": 0.8466865420341492, + "train/negative_loss": 0.8190524578094482, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.24043869972229004, - "train/total_loss": 0.5472671985626221 + "train/positive_loss": 0.027634065598249435, + "train/total_loss": 0.3781276047229767 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.31219038367271423, - "train/contrastive_loss": 3.476602554321289, - "train/negative_loss": 1.8385814428329468, + "train/classification_loss": 0.270837664604187, + "train/contrastive_loss": 3.236480712890625, + "train/negative_loss": 2.2038185596466064, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.6380212306976318, - "train/total_loss": 1.0075109004974365 - }, - { - "epoch": 3.4220532319391634, - "step": 900, - "train/classification_loss": 0.2300805151462555, - "train/contrastive_loss": 1.8227320909500122, - "train/negative_loss": 1.3775594234466553, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.4451726973056793, - "train/total_loss": 0.5946269035339355 + "train/num_positives": 14, + "train/positive_loss": 1.032662034034729, + "train/total_loss": 0.9181337952613831 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.18706543743610382, - "train/contrastive_loss": 1.6546471118927002, - "train/negative_loss": 1.0098271369934082, - "train/num_negatives": 44, + "train/classification_loss": 0.21749143302440643, + "train/contrastive_loss": 1.2317242622375488, + "train/negative_loss": 1.160201072692871, + "train/num_negatives": 38, "train/num_positives": 12, - "train/positive_loss": 0.6448199152946472, - "train/total_loss": 0.5179948806762695 + "train/positive_loss": 0.07152324914932251, + "train/total_loss": 0.46383628249168396 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.26599833369255066, - "train/contrastive_loss": 3.1422245502471924, - "train/negative_loss": 2.2718989849090576, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.8703255653381348, - "train/total_loss": 0.8944432735443115 + "train/classification_loss": 0.2534635663032532, + "train/contrastive_loss": 1.7865002155303955, + "train/negative_loss": 1.6147598028182983, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.17174047231674194, + "train/total_loss": 0.6107636094093323 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.20419970154762268, - "train/contrastive_loss": 1.8180824518203735, - "train/negative_loss": 1.8106420040130615, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.007440468296408653, - "train/total_loss": 0.5678161978721619 + "train/classification_loss": 0.2502749264240265, + "train/contrastive_loss": 4.4567742347717285, + "train/negative_loss": 2.673809051513672, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.7829651832580566, + "train/total_loss": 1.1416298151016235 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.19163630902767181, - "train/contrastive_loss": 1.9224039316177368, - "train/negative_loss": 1.4235929250717163, + "train/classification_loss": 0.27925580739974976, + "train/contrastive_loss": 1.762145757675171, + "train/negative_loss": 1.72877037525177, "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.4988109767436981, - "train/total_loss": 0.5761170983314514 + "train/num_positives": 4, + "train/positive_loss": 0.033375371247529984, + "train/total_loss": 0.6316849589347839 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.205983504652977, - "train/contrastive_loss": 0.7068548202514648, - "train/negative_loss": 0.5902347564697266, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.11662005633115768, - "train/total_loss": 0.3473544716835022 + "train/classification_loss": 0.17603686451911926, + "train/contrastive_loss": 2.4854531288146973, + "train/negative_loss": 1.1680917739868164, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.3173613548278809, + "train/total_loss": 0.6731275320053101 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.27658966183662415, - "train/contrastive_loss": 2.699770450592041, - "train/negative_loss": 1.5192842483520508, - "train/num_negatives": 40, + "train/classification_loss": 0.24764235317707062, + "train/contrastive_loss": 1.7742722034454346, + "train/negative_loss": 0.775140643119812, + "train/num_negatives": 38, "train/num_positives": 14, - "train/positive_loss": 1.1804862022399902, - "train/total_loss": 0.8165438175201416 + "train/positive_loss": 0.9991315007209778, + "train/total_loss": 0.6024968028068542 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.26495087146759033, - "train/contrastive_loss": 1.8526464700698853, - "train/negative_loss": 0.7606337070465088, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 1.0920127630233765, - "train/total_loss": 0.6354801654815674 + "train/classification_loss": 0.21514207124710083, + "train/contrastive_loss": 1.61635160446167, + "train/negative_loss": 1.422782063484192, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.19356957077980042, + "train/total_loss": 0.5384123921394348 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.2666418254375458, - "train/contrastive_loss": 1.604782223701477, - "train/negative_loss": 1.6031246185302734, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.0016576036578044295, - "train/total_loss": 0.5875982642173767 + "train/classification_loss": 0.2396659255027771, + "train/contrastive_loss": 2.763972043991089, + "train/negative_loss": 2.73207688331604, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.03189517930150032, + "train/total_loss": 0.7924603223800659 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.21139425039291382, - "train/contrastive_loss": 3.329662322998047, - "train/negative_loss": 1.7238447666168213, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.6058175563812256, - "train/total_loss": 0.8773267269134521 + "train/classification_loss": 0.2650146186351776, + "train/contrastive_loss": 2.48262357711792, + "train/negative_loss": 2.475081205368042, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.007542412728071213, + "train/total_loss": 0.7615393400192261 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.2829303741455078, - "train/contrastive_loss": 2.372310161590576, - "train/negative_loss": 1.0686851739883423, - "train/num_negatives": 44, + "train/classification_loss": 0.21354293823242188, + "train/contrastive_loss": 2.597524881362915, + "train/negative_loss": 2.4310214519500732, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.16650345921516418, + "train/total_loss": 0.7330479025840759 + }, + { + "epoch": 3.169014084507042, + "step": 900, + "train/classification_loss": 0.20551535487174988, + "train/contrastive_loss": 1.978804588317871, + "train/negative_loss": 1.85262131690979, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.3036249876022339, - "train/total_loss": 0.757392406463623 + "train/positive_loss": 0.12618324160575867, + "train/total_loss": 0.6012762784957886 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.2936272919178009, - "train/contrastive_loss": 1.4977996349334717, - "train/negative_loss": 1.3882708549499512, - "train/num_negatives": 44, + "train/classification_loss": 0.18886318802833557, + "train/contrastive_loss": 2.2895596027374268, + "train/negative_loss": 2.266066789627075, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.10952875018119812, - "train/total_loss": 0.5931872129440308 + "train/positive_loss": 0.023492876440286636, + "train/total_loss": 0.6467751264572144 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.18749801814556122, - "train/contrastive_loss": 0.4284825325012207, - "train/negative_loss": 0.27766361832618713, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.15081891417503357, - "train/total_loss": 0.2731945216655731 + "train/classification_loss": 0.2466670721769333, + "train/contrastive_loss": 1.8031994104385376, + "train/negative_loss": 1.6978203058242798, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.105379119515419, + "train/total_loss": 0.607306957244873 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.18596063554286957, - "train/contrastive_loss": 1.4042861461639404, - "train/negative_loss": 0.529106080532074, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.8751800656318665, - "train/total_loss": 0.46681785583496094 + "train/classification_loss": 0.2870582640171051, + "train/contrastive_loss": 2.804509162902832, + "train/negative_loss": 1.702981948852539, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.1015270948410034, + "train/total_loss": 0.8479601144790649 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.16890466213226318, - "train/contrastive_loss": 1.873727560043335, - "train/negative_loss": 1.2047364711761475, + "train/classification_loss": 0.24687239527702332, + "train/contrastive_loss": 1.1275032758712769, + "train/negative_loss": 0.9102397561073303, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.6689910888671875, - "train/total_loss": 0.5436501502990723 + "train/num_positives": 10, + "train/positive_loss": 0.21726350486278534, + "train/total_loss": 0.4723730683326721 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.2848966419696808, - "train/contrastive_loss": 1.94826340675354, - "train/negative_loss": 0.5879778861999512, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.3602855205535889, - "train/total_loss": 0.6745493412017822 + "train/classification_loss": 0.23745234310626984, + "train/contrastive_loss": 2.7406063079833984, + "train/negative_loss": 2.04325532913208, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.6973509192466736, + "train/total_loss": 0.7855736017227173 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.2771223187446594, - "train/contrastive_loss": 1.5875213146209717, - "train/negative_loss": 1.4872550964355469, + "train/classification_loss": 0.26930058002471924, + "train/contrastive_loss": 2.458677053451538, + "train/negative_loss": 2.4018378257751465, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.1002662181854248, - "train/total_loss": 0.5946265459060669 + "train/num_positives": 4, + "train/positive_loss": 0.056839242577552795, + "train/total_loss": 0.7610360383987427 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.25248628854751587, - "train/contrastive_loss": 2.253152370452881, - "train/negative_loss": 1.7610868215560913, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.4920654296875, - "train/total_loss": 0.703116774559021 + "train/classification_loss": 0.2535470426082611, + "train/contrastive_loss": 1.8438407182693481, + "train/negative_loss": 1.6169536113739014, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.22688713669776917, + "train/total_loss": 0.6223151683807373 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.24282366037368774, - "train/contrastive_loss": 0.7144203782081604, - "train/negative_loss": 0.700264573097229, - "train/num_negatives": 40, + "train/classification_loss": 0.2579350769519806, + "train/contrastive_loss": 3.7865653038024902, + "train/negative_loss": 1.6754318475723267, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.014155827462673187, - "train/total_loss": 0.3857077360153198 + "train/positive_loss": 2.111133337020874, + "train/total_loss": 1.01524817943573 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.26402249932289124, - "train/contrastive_loss": 3.083613872528076, - "train/negative_loss": 1.9977576732635498, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 1.0858560800552368, - "train/total_loss": 0.8807452917098999 + "train/classification_loss": 0.2838534116744995, + "train/contrastive_loss": 1.2872849702835083, + "train/negative_loss": 1.2478972673416138, + "train/num_negatives": 38, + "train/num_positives": 10, + "train/positive_loss": 0.03938775882124901, + "train/total_loss": 0.5413104295730591 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.23431912064552307, - "train/contrastive_loss": 2.2615771293640137, - "train/negative_loss": 1.0778124332427979, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 1.1837645769119263, - "train/total_loss": 0.6866345405578613 + "train/classification_loss": 0.2081357091665268, + "train/contrastive_loss": 2.1145899295806885, + "train/negative_loss": 2.11407470703125, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.0005153264501132071, + "train/total_loss": 0.6310536861419678 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.2527828514575958, - "train/contrastive_loss": 2.9366235733032227, - "train/negative_loss": 1.6605578660964966, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.2760658264160156, - "train/total_loss": 0.8401075601577759 + "train/classification_loss": 0.23127244412899017, + "train/contrastive_loss": 2.789837598800659, + "train/negative_loss": 2.005688428878784, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.7841491103172302, + "train/total_loss": 0.7892400026321411 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.30766230821609497, - "train/contrastive_loss": 1.084456443786621, - "train/negative_loss": 1.0800565481185913, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.004399845376610756, - "train/total_loss": 0.5245535969734192 + "train/classification_loss": 0.2362528145313263, + "train/contrastive_loss": 1.9099745750427246, + "train/negative_loss": 1.3928916454315186, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.5170829892158508, + "train/total_loss": 0.6182477474212646 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.2623668909072876, - "train/contrastive_loss": 2.782198429107666, - "train/negative_loss": 1.8324925899505615, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.9497058391571045, - "train/total_loss": 0.8188065886497498 + "train/classification_loss": 0.259905606508255, + "train/contrastive_loss": 1.8167695999145508, + "train/negative_loss": 1.674485206604004, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.14228445291519165, + "train/total_loss": 0.6232595443725586 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.2475764900445938, - "train/contrastive_loss": 3.036393880844116, - "train/negative_loss": 2.192603349685669, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.8437905311584473, - "train/total_loss": 0.8548552393913269 + "train/classification_loss": 0.28814688324928284, + "train/contrastive_loss": 2.8386669158935547, + "train/negative_loss": 2.108210802078247, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.7304562330245972, + "train/total_loss": 0.8558802604675293 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.2105812132358551, - "train/contrastive_loss": 2.8463809490203857, - "train/negative_loss": 1.2267394065856934, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.6196415424346924, - "train/total_loss": 0.7798573970794678 + "train/classification_loss": 0.18821392953395844, + "train/contrastive_loss": 1.8747836351394653, + "train/negative_loss": 1.8118003606796265, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.06298328191041946, + "train/total_loss": 0.5631706714630127 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.22166648507118225, - "train/contrastive_loss": 2.546171188354492, - "train/negative_loss": 1.9343057870864868, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.6118652820587158, - "train/total_loss": 0.730900764465332 + "train/classification_loss": 0.26654890179634094, + "train/contrastive_loss": 1.9006266593933105, + "train/negative_loss": 1.1798664331436157, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 0.7207602262496948, + "train/total_loss": 0.6466742753982544 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.2266550362110138, - "train/contrastive_loss": 2.9490723609924316, - "train/negative_loss": 1.3982170820236206, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 1.5508551597595215, - "train/total_loss": 0.8164695501327515 + "train/classification_loss": 0.319775253534317, + "train/contrastive_loss": 1.3892217874526978, + "train/negative_loss": 1.3537771701812744, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.035444606095552444, + "train/total_loss": 0.5976196527481079 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.2725416123867035, - "train/contrastive_loss": 2.175379753112793, - "train/negative_loss": 1.920516848564148, - "train/num_negatives": 46, + "train/classification_loss": 0.24637575447559357, + "train/contrastive_loss": 0.6561765670776367, + "train/negative_loss": 0.6435545682907104, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.012622025795280933, + "train/total_loss": 0.37761107087135315 + }, + { + "epoch": 3.169014084507042, + "step": 900, + "train/classification_loss": 0.2969827950000763, + "train/contrastive_loss": 3.5329229831695557, + "train/negative_loss": 2.3411078453063965, + "train/num_negatives": 42, "train/num_positives": 8, - "train/positive_loss": 0.25486278533935547, - "train/total_loss": 0.7076175808906555 + "train/positive_loss": 1.1918151378631592, + "train/total_loss": 1.0035674571990967 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.2377607673406601, - "train/contrastive_loss": 1.8378353118896484, - "train/negative_loss": 1.8275729417800903, + "train/classification_loss": 0.18902000784873962, + "train/contrastive_loss": 0.9614936113357544, + "train/negative_loss": 0.7187949419021606, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.01026233658194542, - "train/total_loss": 0.605327844619751 + "train/num_positives": 10, + "train/positive_loss": 0.24269866943359375, + "train/total_loss": 0.38131874799728394 + }, + { + "epoch": 3.169014084507042, + "step": 900, + "train/classification_loss": 0.2200397104024887, + "train/contrastive_loss": 3.7696337699890137, + "train/negative_loss": 3.1244354248046875, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.6451984643936157, + "train/total_loss": 0.9739664793014526 + }, + { + "epoch": 3.169014084507042, + "step": 900, + "train/classification_loss": 0.27559593319892883, + "train/contrastive_loss": 1.152921438217163, + "train/negative_loss": 1.1186774969100952, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.03424391895532608, + "train/total_loss": 0.5061802268028259 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.2134542316198349, - "train/contrastive_loss": 1.0046383142471313, - "train/negative_loss": 0.9999704360961914, + "train/classification_loss": 0.28067702054977417, + "train/contrastive_loss": 1.3491246700286865, + "train/negative_loss": 1.0117920637130737, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.004667932167649269, - "train/total_loss": 0.41438189148902893 + "train/positive_loss": 0.337332546710968, + "train/total_loss": 0.5505019426345825 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.22166688740253448, - "train/contrastive_loss": 1.5197139978408813, - "train/negative_loss": 1.492210865020752, - "train/num_negatives": 36, + "train/classification_loss": 0.25605034828186035, + "train/contrastive_loss": 1.8900290727615356, + "train/negative_loss": 1.779759407043457, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.11026965826749802, + "train/total_loss": 0.6340562105178833 + }, + { + "epoch": 3.169014084507042, + "step": 900, + "train/classification_loss": 0.31310468912124634, + "train/contrastive_loss": 2.294672966003418, + "train/negative_loss": 1.685768723487854, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.02750312350690365, - "train/total_loss": 0.5256096720695496 + "train/positive_loss": 0.6089043021202087, + "train/total_loss": 0.7720392942428589 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.27137479186058044, - "train/contrastive_loss": 1.7408751249313354, - "train/negative_loss": 1.6375616788864136, + "train/classification_loss": 0.22021882236003876, + "train/contrastive_loss": 2.3119664192199707, + "train/negative_loss": 1.7251931428909302, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.5867732167243958, + "train/total_loss": 0.6826121211051941 + }, + { + "epoch": 3.169014084507042, + "step": 900, + "train/classification_loss": 0.2507193088531494, + "train/contrastive_loss": 1.7474128007888794, + "train/negative_loss": 1.2832971811294556, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.10331346094608307, - "train/total_loss": 0.6195498108863831 + "train/num_positives": 14, + "train/positive_loss": 0.4641156494617462, + "train/total_loss": 0.6002018451690674 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.2253185510635376, - "train/contrastive_loss": 2.4471449851989746, - "train/negative_loss": 1.957360029220581, + "train/classification_loss": 0.29070261120796204, + "train/contrastive_loss": 3.328002452850342, + "train/negative_loss": 3.3279781341552734, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.489784836769104, - "train/total_loss": 0.7147475481033325 + "train/num_positives": 2, + "train/positive_loss": 2.4318991563632153e-05, + "train/total_loss": 0.9563031196594238 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.19799432158470154, - "train/contrastive_loss": 1.4412987232208252, - "train/negative_loss": 0.7746102809906006, + "train/classification_loss": 0.22610525786876678, + "train/contrastive_loss": 2.796560049057007, + "train/negative_loss": 1.909249186515808, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.6666883826255798, - "train/total_loss": 0.4862540662288666 + "train/num_positives": 16, + "train/positive_loss": 0.8873108625411987, + "train/total_loss": 0.7854173183441162 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.3153323829174042, - "train/contrastive_loss": 1.312953233718872, - "train/negative_loss": 1.2650680541992188, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.04788517206907272, - "train/total_loss": 0.577923059463501 + "train/classification_loss": 0.25967052578926086, + "train/contrastive_loss": 2.43886137008667, + "train/negative_loss": 2.076239824295044, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.3626216650009155, + "train/total_loss": 0.7474428415298462 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.18470340967178345, - "train/contrastive_loss": 1.1026957035064697, - "train/negative_loss": 1.1025346517562866, - "train/num_negatives": 48, + "train/classification_loss": 0.2802373766899109, + "train/contrastive_loss": 0.8633297681808472, + "train/negative_loss": 0.6441264152526855, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 0.00016109902935568243, - "train/total_loss": 0.40524256229400635 + "train/positive_loss": 0.21920333802700043, + "train/total_loss": 0.4529033303260803 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.2154005914926529, - "train/contrastive_loss": 0.09103500843048096, - "train/negative_loss": 0.08670936524868011, + "train/classification_loss": 0.2545483112335205, + "train/contrastive_loss": 1.4053995609283447, + "train/negative_loss": 1.0480958223342896, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.00432564364746213, - "train/total_loss": 0.23360759019851685 + "train/num_positives": 14, + "train/positive_loss": 0.3573037385940552, + "train/total_loss": 0.5356281995773315 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.1958092600107193, - "train/contrastive_loss": 1.329616904258728, - "train/negative_loss": 1.1766525506973267, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.15296435356140137, - "train/total_loss": 0.4617326259613037 + "train/classification_loss": 0.3251075744628906, + "train/contrastive_loss": 1.5251171588897705, + "train/negative_loss": 1.2969127893447876, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 0.2282043993473053, + "train/total_loss": 0.6301310062408447 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.2695102095603943, - "train/contrastive_loss": 0.5185620784759521, - "train/negative_loss": 0.3689654767513275, - "train/num_negatives": 28, + "train/classification_loss": 0.20154227316379547, + "train/contrastive_loss": 0.8990278840065002, + "train/negative_loss": 0.8234050273895264, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.14959660172462463, - "train/total_loss": 0.37322261929512024 + "train/positive_loss": 0.07562287896871567, + "train/total_loss": 0.3813478350639343 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.240237295627594, - "train/contrastive_loss": 2.704345464706421, - "train/negative_loss": 1.5245238542556763, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.1798216104507446, - "train/total_loss": 0.7811064124107361 + "train/classification_loss": 0.20155936479568481, + "train/contrastive_loss": 1.091333031654358, + "train/negative_loss": 0.9378836154937744, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.15344937145709991, + "train/total_loss": 0.4198259711265564 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.21846488118171692, - "train/contrastive_loss": 1.1628711223602295, - "train/negative_loss": 1.1619595289230347, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.0009115896536968648, - "train/total_loss": 0.4510391056537628 + "train/classification_loss": 0.23542320728302002, + "train/contrastive_loss": 1.8291407823562622, + "train/negative_loss": 1.4410908222198486, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.38804998993873596, + "train/total_loss": 0.6012513637542725 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.22590331733226776, - "train/contrastive_loss": 1.5970524549484253, - "train/negative_loss": 0.922641396522522, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.6744110584259033, - "train/total_loss": 0.545313835144043 + "train/classification_loss": 0.25759339332580566, + "train/contrastive_loss": 2.8283519744873047, + "train/negative_loss": 1.410085678100586, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.4182664155960083, + "train/total_loss": 0.8232638239860535 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.2493298202753067, - "train/contrastive_loss": 2.594031810760498, - "train/negative_loss": 1.814749836921692, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.7792820930480957, - "train/total_loss": 0.768136203289032 + "train/classification_loss": 0.2626960575580597, + "train/contrastive_loss": 2.476795196533203, + "train/negative_loss": 2.470823287963867, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.0059718117117881775, + "train/total_loss": 0.7580550909042358 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.23647107183933258, - "train/contrastive_loss": 2.3509132862091064, - "train/negative_loss": 0.967637836933136, + "train/classification_loss": 0.20553740859031677, + "train/contrastive_loss": 0.3179081082344055, + "train/negative_loss": 0.2770361602306366, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 1.3832753896713257, - "train/total_loss": 0.7066537141799927 + "train/num_positives": 16, + "train/positive_loss": 0.04087194427847862, + "train/total_loss": 0.2691190242767334 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.21313820779323578, - "train/contrastive_loss": 4.238811492919922, - "train/negative_loss": 2.565220594406128, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.6735906600952148, - "train/total_loss": 1.0609004497528076 + "train/classification_loss": 0.24472014605998993, + "train/contrastive_loss": 3.0500593185424805, + "train/negative_loss": 2.091676950454712, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 0.958382248878479, + "train/total_loss": 0.8547320365905762 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.27565082907676697, - "train/contrastive_loss": 2.3154749870300293, - "train/negative_loss": 1.8508058786392212, + "train/classification_loss": 0.293016254901886, + "train/contrastive_loss": 2.809427261352539, + "train/negative_loss": 1.9499094486236572, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.4646691679954529, - "train/total_loss": 0.7387458086013794 + "train/num_positives": 2, + "train/positive_loss": 0.8595178127288818, + "train/total_loss": 0.8549017310142517 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.24541905522346497, - "train/contrastive_loss": 2.5290298461914062, - "train/negative_loss": 2.377532720565796, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.15149712562561035, - "train/total_loss": 0.7512249946594238 + "train/classification_loss": 0.19498024880886078, + "train/contrastive_loss": 1.9063409566879272, + "train/negative_loss": 1.4219688177108765, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.4843721389770508, + "train/total_loss": 0.5762484669685364 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.21160700917243958, - "train/contrastive_loss": 1.985539436340332, - "train/negative_loss": 1.2527992725372314, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.7327402234077454, - "train/total_loss": 0.6087149381637573 + "train/classification_loss": 0.24755001068115234, + "train/contrastive_loss": 2.495579242706299, + "train/negative_loss": 2.300785779953003, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.19479335844516754, + "train/total_loss": 0.7466658353805542 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.23270884156227112, - "train/contrastive_loss": 2.2597241401672363, - "train/negative_loss": 1.7296522855758667, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.5300719738006592, - "train/total_loss": 0.684653639793396 + "train/classification_loss": 0.2649572491645813, + "train/contrastive_loss": 1.0680320262908936, + "train/negative_loss": 0.9751583933830261, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 0.09287359565496445, + "train/total_loss": 0.47856366634368896 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.24587783217430115, - "train/contrastive_loss": 4.310778617858887, - "train/negative_loss": 3.019174098968506, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.2916043996810913, - "train/total_loss": 1.108033537864685 + "train/classification_loss": 0.23454870283603668, + "train/contrastive_loss": 5.323813438415527, + "train/negative_loss": 5.323805809020996, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 7.486403319489909e-06, + "train/total_loss": 1.2993113994598389 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.26149657368659973, - "train/contrastive_loss": 3.273616313934326, - "train/negative_loss": 1.9373950958251953, + "train/classification_loss": 0.25739285349845886, + "train/contrastive_loss": 1.1266157627105713, + "train/negative_loss": 0.8640680909156799, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.3362210988998413, - "train/total_loss": 0.9162198305130005 + "train/positive_loss": 0.26254770159721375, + "train/total_loss": 0.48271602392196655 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.23799464106559753, - "train/contrastive_loss": 0.8205082416534424, - "train/negative_loss": 0.8184356689453125, + "train/classification_loss": 0.2637128531932831, + "train/contrastive_loss": 1.78715181350708, + "train/negative_loss": 1.5449166297912598, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.002072566654533148, - "train/total_loss": 0.4020962715148926 + "train/num_positives": 8, + "train/positive_loss": 0.24223516881465912, + "train/total_loss": 0.6211432218551636 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.20799323916435242, - "train/contrastive_loss": 2.757878065109253, - "train/negative_loss": 1.137916922569275, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 1.619961142539978, - "train/total_loss": 0.7595688104629517 + "train/classification_loss": 0.200800359249115, + "train/contrastive_loss": 2.5807042121887207, + "train/negative_loss": 1.5696772336959839, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.0110269784927368, + "train/total_loss": 0.716941237449646 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.23943071067333221, - "train/contrastive_loss": 1.1861279010772705, - "train/negative_loss": 0.7122578024864197, - "train/num_negatives": 46, + "train/classification_loss": 0.2878514528274536, + "train/contrastive_loss": 1.995542287826538, + "train/negative_loss": 1.9333635568618774, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.4738701581954956, - "train/total_loss": 0.4766562879085541 + "train/positive_loss": 0.06217879056930542, + "train/total_loss": 0.6869599223136902 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.2995336949825287, - "train/contrastive_loss": 1.992796540260315, - "train/negative_loss": 1.992796540260315, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.6980929970741272 - }, - { - "epoch": 3.4220532319391634, - "eval_exact_match_accuracy": 0.10095238095238095, - "eval_hamming_loss": 0.0842577030812325, - "eval_loss": 0.6455292105674744, - "eval_macro_f1": 0.053720140671259145, - "eval_macro_precision": 0.1701112877583466, - "eval_macro_recall": 0.04274372876332816, - "eval_micro_f1": 0.27552986512524086, - "eval_micro_precision": 0.89937106918239, - "eval_micro_recall": 0.1626848691695108, - "eval_runtime": 2.6371, - "eval_samples_per_second": 199.085, - "eval_steps_per_second": 25.028, + "train/classification_loss": 0.2737419307231903, + "train/contrastive_loss": 4.395015716552734, + "train/negative_loss": 3.087554931640625, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 1.307460904121399, + "train/total_loss": 1.1527451276779175 + }, + { + "epoch": 3.169014084507042, + "eval_exact_match_accuracy": 0.10405643738977072, + "eval_hamming_loss": 0.08621226268285091, + "eval_loss": 0.673316478729248, + "eval_macro_f1": 0.06435205817060254, + "eval_macro_precision": 0.16397058823529412, + "eval_macro_recall": 0.051660252363578525, + "eval_micro_f1": 0.25336927223719674, + "eval_micro_precision": 0.8057142857142857, + "eval_micro_recall": 0.15031982942430705, + "eval_runtime": 2.8568, + "eval_samples_per_second": 198.473, + "eval_steps_per_second": 24.853, "step": 900 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.1833040863275528, - "train/contrastive_loss": 1.1892468929290771, - "train/negative_loss": 0.91339111328125, - "train/num_negatives": 48, + "train/classification_loss": 0.2628500759601593, + "train/contrastive_loss": 1.3113716840744019, + "train/negative_loss": 1.305722951889038, + "train/num_negatives": 42, "train/num_positives": 8, - "train/positive_loss": 0.2758558392524719, - "train/total_loss": 0.4211534857749939 + "train/positive_loss": 0.005648748017847538, + "train/total_loss": 0.5251244306564331 }, { - "epoch": 3.4220532319391634, + "epoch": 3.169014084507042, "step": 900, - "train/classification_loss": 0.23879779875278473, - "train/contrastive_loss": 1.1679967641830444, - "train/negative_loss": 0.9723219275474548, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.1956748068332672, - "train/total_loss": 0.4723971486091614 + "train/classification_loss": 0.21615852415561676, + "train/contrastive_loss": 0.9258386492729187, + "train/negative_loss": 0.7519519925117493, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.17388665676116943, + "train/total_loss": 0.4013262391090393 }, { - "epoch": 3.612167300380228, - "grad_norm": 16.154645919799805, - "learning_rate": 1.987108066971081e-05, - "loss": 1.0457, + "epoch": 3.345070422535211, + "grad_norm": 19.28108787536621, + "learning_rate": 1.988076109936575e-05, + "loss": 1.0389, "step": 950 }, { - "epoch": 3.612167300380228, + "epoch": 3.345070422535211, "step": 950, - "train/classification_loss": 0.2011573165655136, - "train/contrastive_loss": 1.702709674835205, - "train/negative_loss": 1.4330796003341675, + "train/classification_loss": 0.2880273461341858, + "train/contrastive_loss": 2.0527405738830566, + "train/negative_loss": 1.7265995740890503, "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.2696301341056824, - "train/total_loss": 0.541699230670929 + "train/num_positives": 4, + "train/positive_loss": 0.3261411190032959, + "train/total_loss": 0.698575496673584 }, { - "epoch": 3.612167300380228, + "epoch": 3.345070422535211, "step": 950, - "train/classification_loss": 0.17787058651447296, - "train/contrastive_loss": 0.8506872653961182, - "train/negative_loss": 0.5546227693557739, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.29606446623802185, - "train/total_loss": 0.34800803661346436 + "train/classification_loss": 0.2285711169242859, + "train/contrastive_loss": 0.9377437829971313, + "train/negative_loss": 0.8507233262062073, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.08702044188976288, + "train/total_loss": 0.41611987352371216 }, { - "epoch": 3.802281368821293, - "grad_norm": 15.187440872192383, - "learning_rate": 1.9863470319634705e-05, - "loss": 0.97, + "epoch": 3.52112676056338, + "grad_norm": 15.228022575378418, + "learning_rate": 1.987371388301621e-05, + "loss": 1.0161, "step": 1000 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.2921627163887024, - "train/contrastive_loss": 1.9883853197097778, - "train/negative_loss": 0.9602081775665283, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.0281771421432495, - "train/total_loss": 0.689839780330658 + "train/classification_loss": 0.24659588932991028, + "train/contrastive_loss": 2.060753107070923, + "train/negative_loss": 1.508183479309082, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.5525696873664856, + "train/total_loss": 0.6587464809417725 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.2613833248615265, - "train/contrastive_loss": 3.6771202087402344, - "train/negative_loss": 1.9760481119155884, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 1.7010719776153564, - "train/total_loss": 0.996807336807251 + "train/classification_loss": 0.3281591534614563, + "train/contrastive_loss": 1.4071173667907715, + "train/negative_loss": 0.6819202303886414, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.7251971960067749, + "train/total_loss": 0.6095826625823975 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.20435497164726257, - "train/contrastive_loss": 2.017838478088379, - "train/negative_loss": 0.5798546671867371, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.4379838705062866, - "train/total_loss": 0.6079226732254028 + "train/classification_loss": 0.2778911888599396, + "train/contrastive_loss": 3.0015885829925537, + "train/negative_loss": 1.6918468475341797, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.309741735458374, + "train/total_loss": 0.8782088756561279 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.21960744261741638, - "train/contrastive_loss": 3.354827404022217, - "train/negative_loss": 1.7749106884002686, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.5799167156219482, - "train/total_loss": 0.8905729055404663 + "train/classification_loss": 0.1679188311100006, + "train/contrastive_loss": 1.164793848991394, + "train/negative_loss": 1.0715124607086182, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.09328135848045349, + "train/total_loss": 0.40087759494781494 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.22203326225280762, - "train/contrastive_loss": 1.1554811000823975, - "train/negative_loss": 0.7706438302993774, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.38483723998069763, - "train/total_loss": 0.45312947034835815 + "train/classification_loss": 0.2491820901632309, + "train/contrastive_loss": 2.691622495651245, + "train/negative_loss": 2.2680039405822754, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.42361846566200256, + "train/total_loss": 0.787506639957428 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.22906869649887085, - "train/contrastive_loss": 2.250943183898926, - "train/negative_loss": 1.584605097770691, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.6663380861282349, - "train/total_loss": 0.679257333278656 + "train/classification_loss": 0.2490396499633789, + "train/contrastive_loss": 3.1627893447875977, + "train/negative_loss": 1.8857285976409912, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 1.2770607471466064, + "train/total_loss": 0.8815975189208984 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.28143417835235596, - "train/contrastive_loss": 1.942101240158081, - "train/negative_loss": 1.6364967823028564, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.30560439825057983, - "train/total_loss": 0.6698544025421143 + "train/classification_loss": 0.2303515374660492, + "train/contrastive_loss": 2.1189987659454346, + "train/negative_loss": 1.2774397134780884, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.8415589928627014, + "train/total_loss": 0.6541513204574585 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.20754310488700867, - "train/contrastive_loss": 2.8646504878997803, - "train/negative_loss": 1.7477290630340576, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.1169214248657227, - "train/total_loss": 0.7804732322692871 + "train/classification_loss": 0.25099775195121765, + "train/contrastive_loss": 1.2132492065429688, + "train/negative_loss": 1.2132288217544556, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 2.0384995877975598e-05, + "train/total_loss": 0.49364757537841797 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.19207996129989624, - "train/contrastive_loss": 2.604841470718384, - "train/negative_loss": 1.6383646726608276, + "train/classification_loss": 0.18784703314304352, + "train/contrastive_loss": 0.7816201448440552, + "train/negative_loss": 0.46114498376846313, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.9664767980575562, - "train/total_loss": 0.7130482792854309 + "train/positive_loss": 0.32047513127326965, + "train/total_loss": 0.34417104721069336 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.30568015575408936, - "train/contrastive_loss": 3.6762945652008057, - "train/negative_loss": 2.6205496788024902, + "train/classification_loss": 0.2678319215774536, + "train/contrastive_loss": 3.3326683044433594, + "train/negative_loss": 1.8832197189331055, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.0557448863983154, - "train/total_loss": 1.0409390926361084 + "train/num_positives": 14, + "train/positive_loss": 1.4494484663009644, + "train/total_loss": 0.9343655705451965 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.23100784420967102, - "train/contrastive_loss": 2.42850399017334, - "train/negative_loss": 2.2841129302978516, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.14439107477664948, - "train/total_loss": 0.7167086601257324 + "train/classification_loss": 0.2084895223379135, + "train/contrastive_loss": 1.2625449895858765, + "train/negative_loss": 1.0778404474258423, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.18470454216003418, + "train/total_loss": 0.46099853515625 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.18464529514312744, - "train/contrastive_loss": 1.887596845626831, - "train/negative_loss": 1.0671894550323486, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.8204073905944824, - "train/total_loss": 0.5621646642684937 + "train/classification_loss": 0.2397947907447815, + "train/contrastive_loss": 1.2310004234313965, + "train/negative_loss": 1.2204564809799194, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.010543959215283394, + "train/total_loss": 0.4859948754310608 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.2627081871032715, - "train/contrastive_loss": 2.920020818710327, - "train/negative_loss": 2.5588557720184326, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.36116504669189453, - "train/total_loss": 0.8467123508453369 + "train/classification_loss": 0.2481394112110138, + "train/contrastive_loss": 4.0711164474487305, + "train/negative_loss": 2.1748838424682617, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.8962326049804688, + "train/total_loss": 1.0623626708984375 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.1927250176668167, - "train/contrastive_loss": 0.9969231486320496, - "train/negative_loss": 0.9957758784294128, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.001147259958088398, - "train/total_loss": 0.39210963249206543 + "train/classification_loss": 0.278243750333786, + "train/contrastive_loss": 1.6890828609466553, + "train/negative_loss": 1.6558380126953125, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.03324489668011665, + "train/total_loss": 0.6160603165626526 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.18914133310317993, - "train/contrastive_loss": 2.2339835166931152, - "train/negative_loss": 1.7070766687393188, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.5269069671630859, - "train/total_loss": 0.6359380483627319 + "train/classification_loss": 0.17101134359836578, + "train/contrastive_loss": 2.4853248596191406, + "train/negative_loss": 1.0175129175186157, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.467811942100525, + "train/total_loss": 0.6680763363838196 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.20037218928337097, - "train/contrastive_loss": 1.3182028532028198, - "train/negative_loss": 0.8598129749298096, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.45838984847068787, - "train/total_loss": 0.4640127718448639 + "train/classification_loss": 0.23633305728435516, + "train/contrastive_loss": 1.3315913677215576, + "train/negative_loss": 0.9168295860290527, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.41476184129714966, + "train/total_loss": 0.5026513338088989 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.26817142963409424, - "train/contrastive_loss": 2.7224981784820557, - "train/negative_loss": 2.0936388969421387, - "train/num_negatives": 40, + "train/classification_loss": 0.20215222239494324, + "train/contrastive_loss": 1.2464224100112915, + "train/negative_loss": 0.9159505367279053, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.628859281539917, - "train/total_loss": 0.8126710653305054 + "train/positive_loss": 0.3304719030857086, + "train/total_loss": 0.45143669843673706 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.26218199729919434, - "train/contrastive_loss": 1.0556682348251343, - "train/negative_loss": 0.46694469451904297, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.5887235403060913, - "train/total_loss": 0.47331565618515015 + "train/classification_loss": 0.23914499580860138, + "train/contrastive_loss": 2.2031474113464355, + "train/negative_loss": 1.9642727375030518, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.23887477815151215, + "train/total_loss": 0.6797744631767273 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.25496503710746765, - "train/contrastive_loss": 1.1355866193771362, - "train/negative_loss": 1.131484031677246, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.004102571867406368, - "train/total_loss": 0.4820823669433594 + "train/classification_loss": 0.2514301836490631, + "train/contrastive_loss": 1.0630979537963867, + "train/negative_loss": 1.0438395738601685, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.019258422777056694, + "train/total_loss": 0.464049756526947 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.20885993540287018, - "train/contrastive_loss": 4.308316230773926, - "train/negative_loss": 1.9686965942382812, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 2.3396198749542236, - "train/total_loss": 1.0705232620239258 + "train/classification_loss": 0.2085026204586029, + "train/contrastive_loss": 2.897691249847412, + "train/negative_loss": 2.0091145038604736, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.8885766863822937, + "train/total_loss": 0.7880408763885498 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.273400217294693, - "train/contrastive_loss": 2.333958148956299, - "train/negative_loss": 1.1083147525787354, - "train/num_negatives": 44, + "train/classification_loss": 0.19692005217075348, + "train/contrastive_loss": 1.5920015573501587, + "train/negative_loss": 1.1873434782028198, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.2256433963775635, - "train/total_loss": 0.7401918172836304 + "train/positive_loss": 0.4046580493450165, + "train/total_loss": 0.515320360660553 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.28959980607032776, - "train/contrastive_loss": 2.981938362121582, - "train/negative_loss": 2.4082112312316895, - "train/num_negatives": 44, + "train/classification_loss": 0.177629753947258, + "train/contrastive_loss": 3.0995242595672607, + "train/negative_loss": 2.2610092163085938, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.573727011680603, - "train/total_loss": 0.8859875202178955 + "train/positive_loss": 0.8385149836540222, + "train/total_loss": 0.7975346446037292 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.18615517020225525, - "train/contrastive_loss": 1.26418137550354, - "train/negative_loss": 0.5543527007102966, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.7098287343978882, - "train/total_loss": 0.4389914572238922 + "train/classification_loss": 0.23684047162532806, + "train/contrastive_loss": 1.7231837511062622, + "train/negative_loss": 1.2479214668273926, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.47526228427886963, + "train/total_loss": 0.5814772248268127 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.17512096464633942, - "train/contrastive_loss": 0.7283112406730652, - "train/negative_loss": 0.5071076154708862, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.22120364010334015, - "train/total_loss": 0.32078319787979126 + "train/classification_loss": 0.2805205285549164, + "train/contrastive_loss": 2.201094150543213, + "train/negative_loss": 1.3151105642318726, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.8859834671020508, + "train/total_loss": 0.7207393646240234 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.1661948412656784, - "train/contrastive_loss": 2.3548004627227783, - "train/negative_loss": 1.4502300024032593, + "train/classification_loss": 0.23459100723266602, + "train/contrastive_loss": 2.1292617321014404, + "train/negative_loss": 0.8994188904762268, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.9045704007148743, - "train/total_loss": 0.6371549367904663 + "train/num_positives": 10, + "train/positive_loss": 1.2298427820205688, + "train/total_loss": 0.6604433655738831 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.28712108731269836, - "train/contrastive_loss": 1.4081729650497437, - "train/negative_loss": 0.2224937230348587, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.1856791973114014, - "train/total_loss": 0.5687556862831116 + "train/classification_loss": 0.23213499784469604, + "train/contrastive_loss": 2.771615743637085, + "train/negative_loss": 2.22808575630188, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.5435300469398499, + "train/total_loss": 0.7864581346511841 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.26749083399772644, - "train/contrastive_loss": 2.0942084789276123, - "train/negative_loss": 1.8610519170761108, + "train/classification_loss": 0.25737622380256653, + "train/contrastive_loss": 1.7168982028961182, + "train/negative_loss": 1.7139739990234375, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.23315666615962982, - "train/total_loss": 0.6863325238227844 + "train/num_positives": 4, + "train/positive_loss": 0.0029241731390357018, + "train/total_loss": 0.6007558703422546 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.2504037320613861, - "train/contrastive_loss": 2.995645523071289, - "train/negative_loss": 2.458055019378662, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.5375906229019165, - "train/total_loss": 0.8495328426361084 + "train/classification_loss": 0.24245132505893707, + "train/contrastive_loss": 0.5793294906616211, + "train/negative_loss": 0.5424954891204834, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.03683401271700859, + "train/total_loss": 0.35831722617149353 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.2330865114927292, - "train/contrastive_loss": 1.0112091302871704, - "train/negative_loss": 0.9098342061042786, - "train/num_negatives": 40, + "train/classification_loss": 0.2571668028831482, + "train/contrastive_loss": 3.6397993564605713, + "train/negative_loss": 1.5242211818695068, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.10137490183115005, - "train/total_loss": 0.43532833456993103 + "train/positive_loss": 2.1155781745910645, + "train/total_loss": 0.9851266741752625 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.2558920681476593, - "train/contrastive_loss": 3.0639405250549316, - "train/negative_loss": 2.1346945762634277, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.9292459487915039, - "train/total_loss": 0.8686802387237549 + "train/classification_loss": 0.2782219648361206, + "train/contrastive_loss": 0.9946987628936768, + "train/negative_loss": 0.9718318581581116, + "train/num_negatives": 38, + "train/num_positives": 10, + "train/positive_loss": 0.02286689728498459, + "train/total_loss": 0.477161705493927 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.2231116145849228, - "train/contrastive_loss": 2.0552101135253906, - "train/negative_loss": 0.8453595638275146, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 1.2098506689071655, - "train/total_loss": 0.6341536641120911 + "train/classification_loss": 0.20099972188472748, + "train/contrastive_loss": 1.7147216796875, + "train/negative_loss": 1.6883797645568848, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.02634197100996971, + "train/total_loss": 0.5439440608024597 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.2482825517654419, - "train/contrastive_loss": 2.7635626792907715, - "train/negative_loss": 1.832453727722168, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.9311090111732483, - "train/total_loss": 0.8009951114654541 + "train/classification_loss": 0.22822096943855286, + "train/contrastive_loss": 3.840061664581299, + "train/negative_loss": 2.472417116165161, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.3676444292068481, + "train/total_loss": 0.996233344078064 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.3000921905040741, - "train/contrastive_loss": 1.917236328125, - "train/negative_loss": 1.916658639907837, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0005777358892373741, - "train/total_loss": 0.6835394501686096 + "train/classification_loss": 0.2354201376438141, + "train/contrastive_loss": 2.713012933731079, + "train/negative_loss": 2.1191723346710205, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.5938405394554138, + "train/total_loss": 0.7780227661132812 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.2600913345813751, - "train/contrastive_loss": 3.7326407432556152, - "train/negative_loss": 1.6875404119491577, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 2.045100212097168, - "train/total_loss": 1.0066194534301758 + "train/classification_loss": 0.25253626704216003, + "train/contrastive_loss": 1.547911524772644, + "train/negative_loss": 1.4815728664398193, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.0663386881351471, + "train/total_loss": 0.5621185898780823 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.23318879306316376, - "train/contrastive_loss": 2.6206815242767334, - "train/negative_loss": 2.058037281036377, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.5626442432403564, - "train/total_loss": 0.7573251128196716 + "train/classification_loss": 0.2873808741569519, + "train/contrastive_loss": 3.0936532020568848, + "train/negative_loss": 2.072852373123169, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 1.0208008289337158, + "train/total_loss": 0.9061115384101868 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.20349553227424622, - "train/contrastive_loss": 3.4421658515930176, - "train/negative_loss": 1.319165587425232, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 2.123000144958496, - "train/total_loss": 0.8919286727905273 + "train/classification_loss": 0.1729366034269333, + "train/contrastive_loss": 1.9159187078475952, + "train/negative_loss": 1.8947396278381348, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.021179111674427986, + "train/total_loss": 0.5561203360557556 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.22472679615020752, - "train/contrastive_loss": 2.995579719543457, - "train/negative_loss": 1.6695185899734497, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 1.3260610103607178, - "train/total_loss": 0.8238427639007568 + "train/classification_loss": 0.25718632340431213, + "train/contrastive_loss": 1.9518499374389648, + "train/negative_loss": 0.9657573103904724, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 0.9860926270484924, + "train/total_loss": 0.6475563049316406 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.22051213681697845, - "train/contrastive_loss": 1.9699492454528809, - "train/negative_loss": 1.6806327104568481, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.2893165051937103, - "train/total_loss": 0.6145020127296448 + "train/classification_loss": 0.30859431624412537, + "train/contrastive_loss": 2.0318307876586914, + "train/negative_loss": 1.8518718481063843, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.1799589991569519, + "train/total_loss": 0.7149604558944702 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.2536311149597168, - "train/contrastive_loss": 1.2736643552780151, - "train/negative_loss": 1.2406638860702515, - "train/num_negatives": 46, + "train/classification_loss": 0.2361467033624649, + "train/contrastive_loss": 0.563295841217041, + "train/negative_loss": 0.4943731129169464, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.06892272084951401, + "train/total_loss": 0.34880587458610535 + }, + { + "epoch": 3.52112676056338, + "step": 1000, + "train/classification_loss": 0.2919042408466339, + "train/contrastive_loss": 3.4503490924835205, + "train/negative_loss": 2.130063056945801, + "train/num_negatives": 42, "train/num_positives": 8, - "train/positive_loss": 0.033000461757183075, - "train/total_loss": 0.5083639621734619 + "train/positive_loss": 1.3202860355377197, + "train/total_loss": 0.9819741249084473 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.22962750494480133, - "train/contrastive_loss": 1.6551647186279297, - "train/negative_loss": 1.650994896888733, + "train/classification_loss": 0.1812683790922165, + "train/contrastive_loss": 0.7683617472648621, + "train/negative_loss": 0.6469441652297974, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.0041698007844388485, - "train/total_loss": 0.5606604814529419 + "train/num_positives": 10, + "train/positive_loss": 0.1214175820350647, + "train/total_loss": 0.33494073152542114 + }, + { + "epoch": 3.52112676056338, + "step": 1000, + "train/classification_loss": 0.2186700701713562, + "train/contrastive_loss": 3.6752686500549316, + "train/negative_loss": 2.2658612728118896, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 1.4094072580337524, + "train/total_loss": 0.9537237882614136 + }, + { + "epoch": 3.52112676056338, + "step": 1000, + "train/classification_loss": 0.2589084506034851, + "train/contrastive_loss": 0.94645094871521, + "train/negative_loss": 0.945676863193512, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.0007741086883470416, + "train/total_loss": 0.4481986463069916 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.21007344126701355, - "train/contrastive_loss": 1.1497397422790527, - "train/negative_loss": 1.1477009057998657, + "train/classification_loss": 0.2766871154308319, + "train/contrastive_loss": 1.231074333190918, + "train/negative_loss": 1.220503330230713, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.002038854407146573, - "train/total_loss": 0.4400213956832886 + "train/positive_loss": 0.010571012273430824, + "train/total_loss": 0.5229020118713379 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.22124463319778442, - "train/contrastive_loss": 1.7481805086135864, - "train/negative_loss": 1.4155763387680054, - "train/num_negatives": 36, + "train/classification_loss": 0.24836365878582, + "train/contrastive_loss": 1.3828072547912598, + "train/negative_loss": 1.3475455045700073, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.03526173159480095, + "train/total_loss": 0.5249251127243042 + }, + { + "epoch": 3.52112676056338, + "step": 1000, + "train/classification_loss": 0.3172628879547119, + "train/contrastive_loss": 3.442688465118408, + "train/negative_loss": 2.3860249519348145, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.33260414004325867, - "train/total_loss": 0.5708807706832886 + "train/positive_loss": 1.0566633939743042, + "train/total_loss": 1.0058006048202515 + }, + { + "epoch": 3.52112676056338, + "step": 1000, + "train/classification_loss": 0.21261222660541534, + "train/contrastive_loss": 1.6953009366989136, + "train/negative_loss": 1.269429326057434, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.4258715808391571, + "train/total_loss": 0.5516723990440369 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.27128276228904724, - "train/contrastive_loss": 1.984393835067749, - "train/negative_loss": 1.8971554040908813, + "train/classification_loss": 0.23725734651088715, + "train/contrastive_loss": 2.443549394607544, + "train/negative_loss": 1.7813152074813843, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.08723849058151245, - "train/total_loss": 0.6681615114212036 + "train/num_positives": 14, + "train/positive_loss": 0.6622342467308044, + "train/total_loss": 0.7259672284126282 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.21653112769126892, - "train/contrastive_loss": 2.2396745681762695, - "train/negative_loss": 2.215695381164551, + "train/classification_loss": 0.2844632863998413, + "train/contrastive_loss": 2.510272979736328, + "train/negative_loss": 2.509378671646118, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.023979177698493004, - "train/total_loss": 0.6644660234451294 + "train/num_positives": 2, + "train/positive_loss": 0.0008944099536165595, + "train/total_loss": 0.7865179181098938 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.19703924655914307, - "train/contrastive_loss": 1.9972243309020996, - "train/negative_loss": 0.7917791604995728, + "train/classification_loss": 0.21981112658977509, + "train/contrastive_loss": 2.5818116664886475, + "train/negative_loss": 1.5117744207382202, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.2054451704025269, - "train/total_loss": 0.5964841246604919 + "train/num_positives": 16, + "train/positive_loss": 1.0700372457504272, + "train/total_loss": 0.7361735105514526 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.30251768231391907, - "train/contrastive_loss": 1.9310388565063477, - "train/negative_loss": 1.8960665464401245, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.03497232869267464, - "train/total_loss": 0.688725471496582 + "train/classification_loss": 0.2378627061843872, + "train/contrastive_loss": 1.1071714162826538, + "train/negative_loss": 0.8405683040618896, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.2666030824184418, + "train/total_loss": 0.4592970013618469 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.17726735770702362, - "train/contrastive_loss": 1.0508182048797607, - "train/negative_loss": 1.0496089458465576, - "train/num_negatives": 48, + "train/classification_loss": 0.2751213312149048, + "train/contrastive_loss": 0.8608742952346802, + "train/negative_loss": 0.6029313206672668, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 0.0012092888355255127, - "train/total_loss": 0.38743099570274353 + "train/positive_loss": 0.25794294476509094, + "train/total_loss": 0.4472962021827698 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.20908406376838684, - "train/contrastive_loss": 0.13228189945220947, - "train/negative_loss": 0.11978690326213837, + "train/classification_loss": 0.24389474093914032, + "train/contrastive_loss": 1.2948613166809082, + "train/negative_loss": 0.709494411945343, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.012495003640651703, - "train/total_loss": 0.2355404496192932 + "train/num_positives": 14, + "train/positive_loss": 0.5853668451309204, + "train/total_loss": 0.5028669834136963 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.19231106340885162, - "train/contrastive_loss": 1.4862662553787231, - "train/negative_loss": 1.0895308256149292, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.39673539996147156, - "train/total_loss": 0.48956429958343506 + "train/classification_loss": 0.3243478238582611, + "train/contrastive_loss": 1.8313242197036743, + "train/negative_loss": 1.7057645320892334, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 0.12555965781211853, + "train/total_loss": 0.6906126737594604 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.25896385312080383, - "train/contrastive_loss": 0.856110692024231, - "train/negative_loss": 0.08941533416509628, - "train/num_negatives": 28, + "train/classification_loss": 0.18626669049263, + "train/contrastive_loss": 1.1465792655944824, + "train/negative_loss": 1.0097198486328125, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.7666953802108765, - "train/total_loss": 0.4301859736442566 + "train/positive_loss": 0.13685943186283112, + "train/total_loss": 0.415582537651062 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.23121429979801178, - "train/contrastive_loss": 2.6802024841308594, - "train/negative_loss": 1.1559433937072754, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.5242589712142944, - "train/total_loss": 0.7672547698020935 + "train/classification_loss": 0.18911504745483398, + "train/contrastive_loss": 1.2773925065994263, + "train/negative_loss": 0.5432942509651184, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.7340982556343079, + "train/total_loss": 0.44459354877471924 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.20908303558826447, - "train/contrastive_loss": 1.123455286026001, - "train/negative_loss": 1.1211652755737305, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.0022899534087628126, - "train/total_loss": 0.43377411365509033 + "train/classification_loss": 0.22916723787784576, + "train/contrastive_loss": 1.9191935062408447, + "train/negative_loss": 1.0063399076461792, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.9128535389900208, + "train/total_loss": 0.6130059361457825 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.22374683618545532, - "train/contrastive_loss": 2.468479633331299, - "train/negative_loss": 1.3443044424057007, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.1241753101348877, - "train/total_loss": 0.7174427509307861 + "train/classification_loss": 0.2522820830345154, + "train/contrastive_loss": 2.130955219268799, + "train/negative_loss": 1.295016884803772, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.8359382152557373, + "train/total_loss": 0.6784731149673462 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.25712263584136963, - "train/contrastive_loss": 3.888007402420044, - "train/negative_loss": 2.359877824783325, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.5281295776367188, - "train/total_loss": 1.0347241163253784 + "train/classification_loss": 0.2548275589942932, + "train/contrastive_loss": 1.3030062913894653, + "train/negative_loss": 1.2422012090682983, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.06080511212348938, + "train/total_loss": 0.5154287815093994 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.2342974692583084, - "train/contrastive_loss": 2.583207368850708, - "train/negative_loss": 0.8391510248184204, + "train/classification_loss": 0.20139287412166595, + "train/contrastive_loss": 0.4285404682159424, + "train/negative_loss": 0.3663267195224762, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 1.7440563440322876, - "train/total_loss": 0.7509389519691467 + "train/num_positives": 16, + "train/positive_loss": 0.062213748693466187, + "train/total_loss": 0.28710097074508667 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.20095603168010712, - "train/contrastive_loss": 4.0681233406066895, - "train/negative_loss": 2.476071357727051, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.5920518636703491, - "train/total_loss": 1.0145807266235352 + "train/classification_loss": 0.24033991992473602, + "train/contrastive_loss": 2.683631181716919, + "train/negative_loss": 1.7628206014633179, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 0.9208105206489563, + "train/total_loss": 0.777066171169281 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.27246713638305664, - "train/contrastive_loss": 2.923830986022949, - "train/negative_loss": 1.873626470565796, + "train/classification_loss": 0.295841783285141, + "train/contrastive_loss": 3.220322608947754, + "train/negative_loss": 1.9369618892669678, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.0502046346664429, - "train/total_loss": 0.8572333455085754 + "train/num_positives": 2, + "train/positive_loss": 1.2833607196807861, + "train/total_loss": 0.9399063587188721 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.24500462412834167, - "train/contrastive_loss": 3.1717844009399414, - "train/negative_loss": 2.718250274658203, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.4535340666770935, - "train/total_loss": 0.8793615102767944 + "train/classification_loss": 0.18783165514469147, + "train/contrastive_loss": 2.452139377593994, + "train/negative_loss": 1.7211363315582275, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.7310030460357666, + "train/total_loss": 0.678259551525116 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.2031930536031723, - "train/contrastive_loss": 2.8647594451904297, - "train/negative_loss": 1.0771702527999878, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.787589192390442, - "train/total_loss": 0.7761449813842773 + "train/classification_loss": 0.23536640405654907, + "train/contrastive_loss": 1.9533640146255493, + "train/negative_loss": 1.7359412908554077, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.21742267906665802, + "train/total_loss": 0.6260392069816589 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.22679395973682404, - "train/contrastive_loss": 2.7319140434265137, - "train/negative_loss": 1.6165672540664673, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.115346908569336, - "train/total_loss": 0.7731767892837524 + "train/classification_loss": 0.26207321882247925, + "train/contrastive_loss": 1.5476288795471191, + "train/negative_loss": 1.0087196826934814, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 0.5389091968536377, + "train/total_loss": 0.571599006652832 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.24705463647842407, - "train/contrastive_loss": 3.5699172019958496, - "train/negative_loss": 2.3284988403320312, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.241418480873108, - "train/total_loss": 0.9610381126403809 + "train/classification_loss": 0.2266044020652771, + "train/contrastive_loss": 3.437208652496338, + "train/negative_loss": 3.4371867179870605, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 2.185210178140551e-05, + "train/total_loss": 0.9140461683273315 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.2577287554740906, - "train/contrastive_loss": 2.0264906883239746, - "train/negative_loss": 1.6251473426818848, + "train/classification_loss": 0.24644531309604645, + "train/contrastive_loss": 1.173646092414856, + "train/negative_loss": 0.5878365635871887, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.401343435049057, - "train/total_loss": 0.6630269289016724 + "train/positive_loss": 0.5858095288276672, + "train/total_loss": 0.4811745285987854 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.22843895852565765, - "train/contrastive_loss": 1.2286640405654907, - "train/negative_loss": 1.2285631895065308, + "train/classification_loss": 0.2580612301826477, + "train/contrastive_loss": 2.2025082111358643, + "train/negative_loss": 1.7459800243377686, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.00010089068382512778, - "train/total_loss": 0.4741717576980591 + "train/num_positives": 8, + "train/positive_loss": 0.4565282464027405, + "train/total_loss": 0.6985628604888916 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.20521306991577148, - "train/contrastive_loss": 1.5498706102371216, - "train/negative_loss": 0.6216142773628235, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.9282563328742981, - "train/total_loss": 0.5151872038841248 + "train/classification_loss": 0.19897712767124176, + "train/contrastive_loss": 3.304173469543457, + "train/negative_loss": 1.8232210874557495, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.480952501296997, + "train/total_loss": 0.8598118424415588 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.230923593044281, - "train/contrastive_loss": 1.4803950786590576, - "train/negative_loss": 1.1502041816711426, - "train/num_negatives": 46, + "train/classification_loss": 0.28154003620147705, + "train/contrastive_loss": 1.8293871879577637, + "train/negative_loss": 1.365809440612793, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.3301909267902374, - "train/total_loss": 0.5270025730133057 + "train/positive_loss": 0.4635777473449707, + "train/total_loss": 0.6474174857139587 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.29073429107666016, - "train/contrastive_loss": 2.1672143936157227, - "train/negative_loss": 2.1672143936157227, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.7241771817207336 - }, - { - "epoch": 3.802281368821293, - "eval_exact_match_accuracy": 0.1180952380952381, - "eval_hamming_loss": 0.08291316526610644, - "eval_loss": 0.6774991750717163, - "eval_macro_f1": 0.0699432328036483, - "eval_macro_precision": 0.163046633126935, - "eval_macro_recall": 0.050106681597401004, - "eval_micro_f1": 0.28982725527831094, - "eval_micro_precision": 0.9263803680981595, - "eval_micro_recall": 0.17178612059158135, - "eval_runtime": 2.6208, - "eval_samples_per_second": 200.323, - "eval_steps_per_second": 25.183, + "train/classification_loss": 0.2619515657424927, + "train/contrastive_loss": 2.638002395629883, + "train/negative_loss": 1.7948802709579468, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.8431222438812256, + "train/total_loss": 0.7895520329475403 + }, + { + "epoch": 3.52112676056338, + "eval_exact_match_accuracy": 0.1164021164021164, + "eval_hamming_loss": 0.08382612304180932, + "eval_loss": 0.6472141742706299, + "eval_macro_f1": 0.08606886646339473, + "eval_macro_precision": 0.15593506219692177, + "eval_macro_recall": 0.06341313724661743, + "eval_micro_f1": 0.2798573975044563, + "eval_micro_precision": 0.8532608695652174, + "eval_micro_recall": 0.1673773987206823, + "eval_runtime": 2.839, + "eval_samples_per_second": 199.715, + "eval_steps_per_second": 25.008, "step": 1000 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.23623208701610565, - "train/contrastive_loss": 0.6931478977203369, - "train/negative_loss": 0.2563442885875702, - "train/num_negatives": 28, - "train/num_positives": 18, - "train/positive_loss": 0.4368036091327667, - "train/total_loss": 0.3748616576194763 + "train/classification_loss": 0.20714882016181946, + "train/contrastive_loss": 1.2321231365203857, + "train/negative_loss": 0.6984319090843201, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.5336912870407104, + "train/total_loss": 0.45357346534729004 }, { - "epoch": 3.802281368821293, + "epoch": 3.52112676056338, "step": 1000, - "train/classification_loss": 0.25138843059539795, - "train/contrastive_loss": 0.9785668849945068, - "train/negative_loss": 0.6237108707427979, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.354856014251709, - "train/total_loss": 0.4471018314361572 + "train/classification_loss": 0.2867993116378784, + "train/contrastive_loss": 1.9529364109039307, + "train/negative_loss": 1.218223214149475, + "train/num_negatives": 22, + "train/num_positives": 24, + "train/positive_loss": 0.7347131967544556, + "train/total_loss": 0.6773866415023804 }, { - "epoch": 3.9923954372623576, - "grad_norm": 13.786935806274414, - "learning_rate": 1.9855859969558603e-05, - "loss": 1.0065, + "epoch": 3.697183098591549, + "grad_norm": 17.127878189086914, + "learning_rate": 1.9866666666666667e-05, + "loss": 0.9922, "step": 1050 }, { - "epoch": 3.9923954372623576, + "epoch": 3.697183098591549, "step": 1050, - "train/classification_loss": 0.2684571146965027, - "train/contrastive_loss": 1.0206866264343262, - "train/negative_loss": 1.0206866264343262, - "train/num_negatives": 50, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.4725944399833679 + "train/classification_loss": 0.2515946626663208, + "train/contrastive_loss": 1.5435893535614014, + "train/negative_loss": 0.8575651049613953, + "train/num_negatives": 40, + "train/num_positives": 8, + "train/positive_loss": 0.6860242486000061, + "train/total_loss": 0.5603125095367432 }, { - "epoch": 3.9923954372623576, + "epoch": 3.697183098591549, "step": 1050, - "train/classification_loss": 0.24986664950847626, - "train/contrastive_loss": 1.888816237449646, - "train/negative_loss": 0.929886519908905, - "train/num_negatives": 34, - "train/num_positives": 14, - "train/positive_loss": 0.958929717540741, - "train/total_loss": 0.6276298761367798 + "train/classification_loss": 0.25624769926071167, + "train/contrastive_loss": 0.8319815397262573, + "train/negative_loss": 0.7657333016395569, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.06624826043844223, + "train/total_loss": 0.4226440191268921 }, { - "epoch": 4.182509505703422, - "grad_norm": 18.117549896240234, - "learning_rate": 1.9848249619482498e-05, - "loss": 0.9737, + "epoch": 3.873239436619718, + "grad_norm": 11.773343086242676, + "learning_rate": 1.9859619450317125e-05, + "loss": 0.9917, "step": 1100 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2668207287788391, - "train/contrastive_loss": 0.9192310571670532, - "train/negative_loss": 0.5305595397949219, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.38867148756980896, - "train/total_loss": 0.45066696405410767 + "train/classification_loss": 0.23831522464752197, + "train/contrastive_loss": 2.427889823913574, + "train/negative_loss": 2.3044111728668213, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.12347874045372009, + "train/total_loss": 0.7238931655883789 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.26099029183387756, - "train/contrastive_loss": 2.419377326965332, - "train/negative_loss": 1.4203153848648071, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.9990618824958801, - "train/total_loss": 0.7448657751083374 + "train/classification_loss": 0.3279215395450592, + "train/contrastive_loss": 2.4086203575134277, + "train/negative_loss": 2.1797428131103516, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.22887754440307617, + "train/total_loss": 0.8096456527709961 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.19658173620700836, - "train/contrastive_loss": 2.922646999359131, - "train/negative_loss": 1.4450081586837769, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.477638840675354, - "train/total_loss": 0.7811111211776733 + "train/classification_loss": 0.2689489424228668, + "train/contrastive_loss": 2.8508143424987793, + "train/negative_loss": 2.243807554244995, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.6070067286491394, + "train/total_loss": 0.8391118049621582 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.20297516882419586, - "train/contrastive_loss": 2.467620372772217, - "train/negative_loss": 2.0907623767852783, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.3768579661846161, - "train/total_loss": 0.696499228477478 + "train/classification_loss": 0.17307421565055847, + "train/contrastive_loss": 2.916548252105713, + "train/negative_loss": 2.9024291038513184, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.014119124040007591, + "train/total_loss": 0.7563838958740234 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.21071162819862366, - "train/contrastive_loss": 1.9756425619125366, - "train/negative_loss": 1.7376790046691895, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.23796354234218597, - "train/total_loss": 0.6058401465415955 + "train/classification_loss": 0.23352594673633575, + "train/contrastive_loss": 4.547475337982178, + "train/negative_loss": 4.540761470794678, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.00671407300978899, + "train/total_loss": 1.1430209875106812 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2180548459291458, - "train/contrastive_loss": 1.847900152206421, - "train/negative_loss": 1.5013225078582764, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.34657764434814453, - "train/total_loss": 0.5876348614692688 + "train/classification_loss": 0.24048519134521484, + "train/contrastive_loss": 2.9878389835357666, + "train/negative_loss": 2.5133676528930664, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.4744713008403778, + "train/total_loss": 0.8380529880523682 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2676788568496704, - "train/contrastive_loss": 1.4847862720489502, - "train/negative_loss": 1.0579952001571655, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.4267910122871399, - "train/total_loss": 0.5646361112594604 + "train/classification_loss": 0.22496269643306732, + "train/contrastive_loss": 3.085120677947998, + "train/negative_loss": 1.4385730028152466, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.6465476751327515, + "train/total_loss": 0.8419868350028992 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.18839603662490845, - "train/contrastive_loss": 1.0893162488937378, - "train/negative_loss": 0.991484522819519, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.09783173352479935, - "train/total_loss": 0.40625929832458496 + "train/classification_loss": 0.2456701546907425, + "train/contrastive_loss": 1.4610172510147095, + "train/negative_loss": 1.4609971046447754, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 2.014657366089523e-05, + "train/total_loss": 0.5378736257553101 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.18721319735050201, - "train/contrastive_loss": 1.2844542264938354, - "train/negative_loss": 1.251680612564087, + "train/classification_loss": 0.17375747859477997, + "train/contrastive_loss": 0.6639258861541748, + "train/negative_loss": 0.5872737169265747, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.03277360647916794, - "train/total_loss": 0.44410407543182373 + "train/positive_loss": 0.07665219157934189, + "train/total_loss": 0.30654266476631165 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.30845382809638977, - "train/contrastive_loss": 3.599503993988037, - "train/negative_loss": 2.080617666244507, + "train/classification_loss": 0.2648347318172455, + "train/contrastive_loss": 3.2213895320892334, + "train/negative_loss": 2.68839693069458, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.5188863277435303, - "train/total_loss": 1.0283546447753906 + "train/num_positives": 14, + "train/positive_loss": 0.5329925417900085, + "train/total_loss": 0.9091126918792725 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.21449322998523712, - "train/contrastive_loss": 1.6141719818115234, - "train/negative_loss": 1.2524513006210327, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.3617207109928131, - "train/total_loss": 0.5373276472091675 + "train/classification_loss": 0.19973190128803253, + "train/contrastive_loss": 1.3084367513656616, + "train/negative_loss": 1.2911714315414429, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.017265362665057182, + "train/total_loss": 0.4614192843437195 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.1748025268316269, - "train/contrastive_loss": 1.31058931350708, - "train/negative_loss": 1.074753761291504, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.23583559691905975, - "train/total_loss": 0.4369204044342041 + "train/classification_loss": 0.23393574357032776, + "train/contrastive_loss": 2.3132243156433105, + "train/negative_loss": 2.2991549968719482, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.014069284312427044, + "train/total_loss": 0.6965806484222412 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2648574113845825, - "train/contrastive_loss": 4.9353532791137695, - "train/negative_loss": 2.446695327758789, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 2.4886577129364014, - "train/total_loss": 1.2519280910491943 + "train/classification_loss": 0.24310286343097687, + "train/contrastive_loss": 4.247648239135742, + "train/negative_loss": 2.6359286308288574, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.6117196083068848, + "train/total_loss": 1.092632532119751 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.18789063394069672, - "train/contrastive_loss": 2.83552885055542, - "train/negative_loss": 2.8323540687561035, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.003174758516252041, - "train/total_loss": 0.7549964189529419 + "train/classification_loss": 0.257038414478302, + "train/contrastive_loss": 1.3331999778747559, + "train/negative_loss": 1.2541568279266357, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.07904312014579773, + "train/total_loss": 0.5236784219741821 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.1858423948287964, - "train/contrastive_loss": 2.6916558742523193, - "train/negative_loss": 1.9690110683441162, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.7226448059082031, - "train/total_loss": 0.7241736054420471 + "train/classification_loss": 0.1624750941991806, + "train/contrastive_loss": 1.777597427368164, + "train/negative_loss": 0.9836911559104919, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.7939062118530273, + "train/total_loss": 0.5179945826530457 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.19036194682121277, - "train/contrastive_loss": 0.7931206822395325, - "train/negative_loss": 0.7704713344573975, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.022649375721812248, - "train/total_loss": 0.34898608922958374 + "train/classification_loss": 0.23082579672336578, + "train/contrastive_loss": 1.6016342639923096, + "train/negative_loss": 1.4055243730545044, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.19610992074012756, + "train/total_loss": 0.5511526465415955 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2694917321205139, - "train/contrastive_loss": 2.901045083999634, - "train/negative_loss": 2.274977684020996, - "train/num_negatives": 40, + "train/classification_loss": 0.19881311058998108, + "train/contrastive_loss": 1.967290997505188, + "train/negative_loss": 1.9302352666854858, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.6260673403739929, - "train/total_loss": 0.8497007489204407 + "train/positive_loss": 0.03705578297376633, + "train/total_loss": 0.5922713279724121 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2498902678489685, - "train/contrastive_loss": 1.0433846712112427, - "train/negative_loss": 0.30051958560943604, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.7428650856018066, - "train/total_loss": 0.45856720209121704 + "train/classification_loss": 0.23374062776565552, + "train/contrastive_loss": 2.46852445602417, + "train/negative_loss": 2.39452862739563, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.07399576902389526, + "train/total_loss": 0.7274454832077026 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.25613826513290405, - "train/contrastive_loss": 2.0351057052612305, - "train/negative_loss": 2.0298376083374023, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.005268200300633907, - "train/total_loss": 0.6631593704223633 + "train/classification_loss": 0.24928463995456696, + "train/contrastive_loss": 1.578418254852295, + "train/negative_loss": 1.5245360136032104, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.053882207721471786, + "train/total_loss": 0.5649682879447937 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.19453038275241852, - "train/contrastive_loss": 1.8485159873962402, - "train/negative_loss": 1.171599268913269, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.6769167184829712, - "train/total_loss": 0.5642336010932922 + "train/classification_loss": 0.20311260223388672, + "train/contrastive_loss": 2.4354147911071777, + "train/negative_loss": 2.2176971435546875, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.21771764755249023, + "train/total_loss": 0.6901955604553223 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2798168659210205, - "train/contrastive_loss": 2.5056469440460205, - "train/negative_loss": 1.2100244760513306, - "train/num_negatives": 44, + "train/classification_loss": 0.18941310048103333, + "train/contrastive_loss": 2.361656904220581, + "train/negative_loss": 1.9931424856185913, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.29562246799469, - "train/total_loss": 0.7809462547302246 + "train/positive_loss": 0.36851444840431213, + "train/total_loss": 0.6617444753646851 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2921021282672882, - "train/contrastive_loss": 2.3105199337005615, - "train/negative_loss": 1.7036676406860352, - "train/num_negatives": 44, + "train/classification_loss": 0.17063772678375244, + "train/contrastive_loss": 2.5735113620758057, + "train/negative_loss": 2.4765305519104004, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.6068523526191711, - "train/total_loss": 0.754206120967865 + "train/positive_loss": 0.09698088467121124, + "train/total_loss": 0.6853399872779846 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.17488445341587067, - "train/contrastive_loss": 0.9257868528366089, - "train/negative_loss": 0.40497493743896484, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.520811915397644, - "train/total_loss": 0.3600418269634247 + "train/classification_loss": 0.2295491248369217, + "train/contrastive_loss": 3.1196184158325195, + "train/negative_loss": 1.6238735914230347, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 1.4957447052001953, + "train/total_loss": 0.8534728288650513 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.1726226508617401, - "train/contrastive_loss": 0.3532654345035553, - "train/negative_loss": 0.3417278230190277, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.011537617072463036, - "train/total_loss": 0.2432757318019867 + "train/classification_loss": 0.26753488183021545, + "train/contrastive_loss": 3.100071668624878, + "train/negative_loss": 2.682760000228882, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.4173116087913513, + "train/total_loss": 0.8875492811203003 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.15534253418445587, - "train/contrastive_loss": 1.756361484527588, - "train/negative_loss": 1.6153217554092407, + "train/classification_loss": 0.2236568033695221, + "train/contrastive_loss": 1.2429547309875488, + "train/negative_loss": 1.1811189651489258, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.14103974401950836, - "train/total_loss": 0.5066148638725281 + "train/num_positives": 10, + "train/positive_loss": 0.06183582544326782, + "train/total_loss": 0.47224774956703186 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2799184024333954, - "train/contrastive_loss": 1.53036630153656, - "train/negative_loss": 0.540463387966156, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 0.989902913570404, - "train/total_loss": 0.5859916806221008 + "train/classification_loss": 0.22711753845214844, + "train/contrastive_loss": 3.682501792907715, + "train/negative_loss": 3.281054973602295, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.4014468491077423, + "train/total_loss": 0.9636179208755493 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2791735827922821, - "train/contrastive_loss": 2.5850682258605957, - "train/negative_loss": 1.8083932399749756, + "train/classification_loss": 0.25347572565078735, + "train/contrastive_loss": 2.073573350906372, + "train/negative_loss": 2.0726492404937744, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.7766749262809753, - "train/total_loss": 0.7961872816085815 + "train/num_positives": 4, + "train/positive_loss": 0.0009240152430720627, + "train/total_loss": 0.6681903600692749 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.23146189749240875, - "train/contrastive_loss": 1.7876026630401611, - "train/negative_loss": 1.608972191810608, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.17863047122955322, - "train/total_loss": 0.5889824628829956 + "train/classification_loss": 0.2347225546836853, + "train/contrastive_loss": 1.01730215549469, + "train/negative_loss": 1.0127335786819458, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.004568600561469793, + "train/total_loss": 0.4381830096244812 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.22719351947307587, - "train/contrastive_loss": 0.7956789135932922, - "train/negative_loss": 0.7463369369506836, - "train/num_negatives": 40, + "train/classification_loss": 0.26009488105773926, + "train/contrastive_loss": 3.5207643508911133, + "train/negative_loss": 1.9920603036880493, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.04934195429086685, - "train/total_loss": 0.3863292932510376 + "train/positive_loss": 1.5287041664123535, + "train/total_loss": 0.9642477631568909 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.24516166746616364, - "train/contrastive_loss": 1.0034472942352295, - "train/negative_loss": 0.7667389512062073, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.23670828342437744, - "train/total_loss": 0.4458511471748352 + "train/classification_loss": 0.2768598198890686, + "train/contrastive_loss": 1.423134446144104, + "train/negative_loss": 1.416304588317871, + "train/num_negatives": 38, + "train/num_positives": 10, + "train/positive_loss": 0.0068298340775072575, + "train/total_loss": 0.5614867210388184 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.21536126732826233, - "train/contrastive_loss": 1.6731003522872925, - "train/negative_loss": 0.7142210006713867, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.9588793516159058, - "train/total_loss": 0.5499813556671143 + "train/classification_loss": 0.19549112021923065, + "train/contrastive_loss": 2.6246564388275146, + "train/negative_loss": 2.6213796138763428, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.003276816103607416, + "train/total_loss": 0.7204224467277527 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.24722589552402496, - "train/contrastive_loss": 3.1206254959106445, - "train/negative_loss": 2.0089404582977295, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.111685037612915, - "train/total_loss": 0.8713510036468506 + "train/classification_loss": 0.2180773764848709, + "train/contrastive_loss": 3.728764295578003, + "train/negative_loss": 3.021785020828247, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.7069792151451111, + "train/total_loss": 0.9638302326202393 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2828051745891571, - "train/contrastive_loss": 0.8083522915840149, - "train/negative_loss": 0.8038268685340881, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.004525395110249519, - "train/total_loss": 0.4444756507873535 + "train/classification_loss": 0.22918613255023956, + "train/contrastive_loss": 3.689828395843506, + "train/negative_loss": 3.0234792232513428, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.6663492321968079, + "train/total_loss": 0.9671518206596375 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2499246597290039, - "train/contrastive_loss": 1.927088975906372, - "train/negative_loss": 1.7217016220092773, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.20538738369941711, - "train/total_loss": 0.6353424787521362 + "train/classification_loss": 0.25230127573013306, + "train/contrastive_loss": 3.1345293521881104, + "train/negative_loss": 1.7227782011032104, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 1.4117511510849, + "train/total_loss": 0.8792071342468262 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.24331827461719513, - "train/contrastive_loss": 4.942056655883789, - "train/negative_loss": 3.1065292358398438, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.8355271816253662, - "train/total_loss": 1.2317296266555786 + "train/classification_loss": 0.284618616104126, + "train/contrastive_loss": 2.3714370727539062, + "train/negative_loss": 1.9443162679672241, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.4271208643913269, + "train/total_loss": 0.7589060068130493 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.20164476335048676, - "train/contrastive_loss": 3.606774091720581, - "train/negative_loss": 2.0573363304138184, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.5494377613067627, - "train/total_loss": 0.9229996204376221 + "train/classification_loss": 0.17087684571743011, + "train/contrastive_loss": 2.491471767425537, + "train/negative_loss": 2.4905407428741455, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.000930906506255269, + "train/total_loss": 0.6691712141036987 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2059522569179535, - "train/contrastive_loss": 2.9247050285339355, - "train/negative_loss": 2.6467437744140625, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.2779611647129059, - "train/total_loss": 0.7908933162689209 + "train/classification_loss": 0.25164154171943665, + "train/contrastive_loss": 2.440986394882202, + "train/negative_loss": 2.041640520095825, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 0.39934593439102173, + "train/total_loss": 0.7398388385772705 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.21676059067249298, - "train/contrastive_loss": 2.379136800765991, - "train/negative_loss": 1.781358242034912, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.5977785587310791, - "train/total_loss": 0.6925879716873169 + "train/classification_loss": 0.3038838803768158, + "train/contrastive_loss": 1.4890421628952026, + "train/negative_loss": 1.3099987506866455, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.17904341220855713, + "train/total_loss": 0.6016923189163208 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2540681064128876, - "train/contrastive_loss": 1.8045587539672852, - "train/negative_loss": 1.6730177402496338, - "train/num_negatives": 46, + "train/classification_loss": 0.23057648539543152, + "train/contrastive_loss": 1.0312519073486328, + "train/negative_loss": 0.9848721623420715, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.04637974873185158, + "train/total_loss": 0.4368268847465515 + }, + { + "epoch": 3.873239436619718, + "step": 1100, + "train/classification_loss": 0.2917994260787964, + "train/contrastive_loss": 5.907462120056152, + "train/negative_loss": 2.056241750717163, + "train/num_negatives": 42, "train/num_positives": 8, - "train/positive_loss": 0.13154105842113495, - "train/total_loss": 0.6149798631668091 + "train/positive_loss": 3.85122013092041, + "train/total_loss": 1.4732918739318848 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2215055525302887, - "train/contrastive_loss": 1.7963535785675049, - "train/negative_loss": 1.7883410453796387, + "train/classification_loss": 0.17872579395771027, + "train/contrastive_loss": 1.196420669555664, + "train/negative_loss": 1.0647977590560913, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.008012540638446808, - "train/total_loss": 0.5807762742042542 + "train/num_positives": 10, + "train/positive_loss": 0.13162286579608917, + "train/total_loss": 0.4180099368095398 + }, + { + "epoch": 3.873239436619718, + "step": 1100, + "train/classification_loss": 0.20605939626693726, + "train/contrastive_loss": 2.464670181274414, + "train/negative_loss": 2.334632635116577, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.13003748655319214, + "train/total_loss": 0.698993444442749 + }, + { + "epoch": 3.873239436619718, + "step": 1100, + "train/classification_loss": 0.2552935481071472, + "train/contrastive_loss": 1.8695108890533447, + "train/negative_loss": 1.8687865734100342, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.0007242750725708902, + "train/total_loss": 0.6291956901550293 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.212464839220047, - "train/contrastive_loss": 2.3838467597961426, - "train/negative_loss": 1.8664510250091553, + "train/classification_loss": 0.2797108590602875, + "train/contrastive_loss": 0.9901911616325378, + "train/negative_loss": 0.9834886193275452, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.5173958539962769, - "train/total_loss": 0.68923419713974 + "train/positive_loss": 0.00670256931334734, + "train/total_loss": 0.4777491092681885 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.21989482641220093, - "train/contrastive_loss": 2.0414488315582275, - "train/negative_loss": 1.797282338142395, - "train/num_negatives": 36, + "train/classification_loss": 0.24419371783733368, + "train/contrastive_loss": 1.9920066595077515, + "train/negative_loss": 1.8763504028320312, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.1156562864780426, + "train/total_loss": 0.6425950527191162 + }, + { + "epoch": 3.873239436619718, + "step": 1100, + "train/classification_loss": 0.3122989237308502, + "train/contrastive_loss": 2.5958714485168457, + "train/negative_loss": 1.685879111289978, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.24416647851467133, - "train/total_loss": 0.6281845569610596 + "train/positive_loss": 0.9099923372268677, + "train/total_loss": 0.8314732313156128 + }, + { + "epoch": 3.873239436619718, + "step": 1100, + "train/classification_loss": 0.20681218802928925, + "train/contrastive_loss": 2.322512626647949, + "train/negative_loss": 2.1041202545166016, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.2183922678232193, + "train/total_loss": 0.6713147163391113 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.26418378949165344, - "train/contrastive_loss": 2.096250534057617, - "train/negative_loss": 1.871886134147644, + "train/classification_loss": 0.2414204627275467, + "train/contrastive_loss": 3.609355926513672, + "train/negative_loss": 3.08012318611145, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.2243644893169403, - "train/total_loss": 0.6834338903427124 + "train/num_positives": 14, + "train/positive_loss": 0.5292326211929321, + "train/total_loss": 0.9632916450500488 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.20290325582027435, - "train/contrastive_loss": 1.3768373727798462, - "train/negative_loss": 1.1588186025619507, + "train/classification_loss": 0.2742444574832916, + "train/contrastive_loss": 2.749952554702759, + "train/negative_loss": 2.749920606613159, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.2180187702178955, - "train/total_loss": 0.4782707095146179 + "train/num_positives": 2, + "train/positive_loss": 3.194859891664237e-05, + "train/total_loss": 0.8242349624633789 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.18267783522605896, - "train/contrastive_loss": 1.6962816715240479, - "train/negative_loss": 0.708185613155365, + "train/classification_loss": 0.21579399704933167, + "train/contrastive_loss": 2.344604969024658, + "train/negative_loss": 1.9381828308105469, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.9880959987640381, - "train/total_loss": 0.5219341516494751 + "train/num_positives": 16, + "train/positive_loss": 0.40642213821411133, + "train/total_loss": 0.6847150325775146 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.3069040775299072, - "train/contrastive_loss": 1.37820303440094, - "train/negative_loss": 1.27793550491333, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.10026757419109344, - "train/total_loss": 0.5825446844100952 + "train/classification_loss": 0.2289884239435196, + "train/contrastive_loss": 1.2784075736999512, + "train/negative_loss": 1.1660082340240479, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.11239929497241974, + "train/total_loss": 0.48466992378234863 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.1680459976196289, - "train/contrastive_loss": 1.2695292234420776, - "train/negative_loss": 1.269436240196228, - "train/num_negatives": 48, + "train/classification_loss": 0.26019981503486633, + "train/contrastive_loss": 0.932488203048706, + "train/negative_loss": 0.781326413154602, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 9.296923963120207e-05, - "train/total_loss": 0.42195186018943787 + "train/positive_loss": 0.1511618047952652, + "train/total_loss": 0.446697473526001 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.19722016155719757, - "train/contrastive_loss": 0.20405307412147522, - "train/negative_loss": 0.20106415450572968, + "train/classification_loss": 0.23466898500919342, + "train/contrastive_loss": 1.225492238998413, + "train/negative_loss": 1.1051048040390015, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.0029889268334954977, - "train/total_loss": 0.23803077638149261 + "train/num_positives": 14, + "train/positive_loss": 0.12038746476173401, + "train/total_loss": 0.47976744174957275 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.18109764158725739, - "train/contrastive_loss": 1.0783178806304932, - "train/negative_loss": 1.0699362754821777, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.008381661958992481, - "train/total_loss": 0.3967612385749817 + "train/classification_loss": 0.3182857632637024, + "train/contrastive_loss": 2.451718330383301, + "train/negative_loss": 2.353672504425049, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 0.09804584830999374, + "train/total_loss": 0.8086293935775757 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2596445381641388, - "train/contrastive_loss": 1.2702559232711792, - "train/negative_loss": 1.257446050643921, - "train/num_negatives": 28, + "train/classification_loss": 0.1761728674173355, + "train/contrastive_loss": 1.9230961799621582, + "train/negative_loss": 1.9159491062164307, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.012809840962290764, - "train/total_loss": 0.5136957168579102 + "train/positive_loss": 0.007147099357098341, + "train/total_loss": 0.560792088508606 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2248270958662033, - "train/contrastive_loss": 2.0854337215423584, - "train/negative_loss": 1.3445037603378296, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.740929901599884, - "train/total_loss": 0.6419138312339783 + "train/classification_loss": 0.17623940110206604, + "train/contrastive_loss": 0.9000499248504639, + "train/negative_loss": 0.8372023105621338, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.06284762918949127, + "train/total_loss": 0.3562493920326233 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.19955314695835114, - "train/contrastive_loss": 1.0166773796081543, - "train/negative_loss": 1.003315806388855, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.013361582532525063, - "train/total_loss": 0.40288862586021423 + "train/classification_loss": 0.21636329591274261, + "train/contrastive_loss": 1.6189684867858887, + "train/negative_loss": 1.589046835899353, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.029921649023890495, + "train/total_loss": 0.5401570200920105 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.21929931640625, - "train/contrastive_loss": 1.6632907390594482, - "train/negative_loss": 1.4202933311462402, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.242997407913208, - "train/total_loss": 0.5519574880599976 + "train/classification_loss": 0.24555574357509613, + "train/contrastive_loss": 2.163731098175049, + "train/negative_loss": 1.5679959058761597, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.5957351326942444, + "train/total_loss": 0.678301990032196 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.24395239353179932, - "train/contrastive_loss": 3.0102789402008057, - "train/negative_loss": 2.332637071609497, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.6776419281959534, - "train/total_loss": 0.8460081815719604 + "train/classification_loss": 0.24967283010482788, + "train/contrastive_loss": 1.6834166049957275, + "train/negative_loss": 1.6079005002975464, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.07551614940166473, + "train/total_loss": 0.5863561630249023 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2162342667579651, - "train/contrastive_loss": 1.4474358558654785, - "train/negative_loss": 0.47811517119407654, + "train/classification_loss": 0.18836277723312378, + "train/contrastive_loss": 0.3667788505554199, + "train/negative_loss": 0.35757413506507874, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.9693207144737244, - "train/total_loss": 0.5057214498519897 + "train/num_positives": 16, + "train/positive_loss": 0.009204700589179993, + "train/total_loss": 0.2617185413837433 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.20283320546150208, - "train/contrastive_loss": 2.931414842605591, - "train/negative_loss": 1.9867736101150513, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.9446412920951843, - "train/total_loss": 0.7891161441802979 + "train/classification_loss": 0.2358929067850113, + "train/contrastive_loss": 2.9412269592285156, + "train/negative_loss": 2.490908145904541, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 0.4503189027309418, + "train/total_loss": 0.8241382837295532 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.26606225967407227, - "train/contrastive_loss": 2.975637912750244, - "train/negative_loss": 1.8630505800247192, + "train/classification_loss": 0.2816947102546692, + "train/contrastive_loss": 4.933274269104004, + "train/negative_loss": 2.0538012981414795, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.1125874519348145, - "train/total_loss": 0.8611898422241211 + "train/num_positives": 2, + "train/positive_loss": 2.8794729709625244, + "train/total_loss": 1.2683496475219727 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2345093935728073, - "train/contrastive_loss": 1.8298792839050293, - "train/negative_loss": 1.7545764446258545, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.07530281692743301, - "train/total_loss": 0.6004852652549744 + "train/classification_loss": 0.17934270203113556, + "train/contrastive_loss": 3.210433006286621, + "train/negative_loss": 2.8731000423431396, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.33733296394348145, + "train/total_loss": 0.8214293122291565 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.20351941883563995, - "train/contrastive_loss": 2.2129974365234375, - "train/negative_loss": 1.704502820968628, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.5084947347640991, - "train/total_loss": 0.6461189389228821 + "train/classification_loss": 0.21843379735946655, + "train/contrastive_loss": 0.5027125477790833, + "train/negative_loss": 0.48300161957740784, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.019710931926965714, + "train/total_loss": 0.3189763128757477 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2249593734741211, - "train/contrastive_loss": 2.978782892227173, - "train/negative_loss": 1.9885690212249756, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.9902138113975525, - "train/total_loss": 0.8207159638404846 + "train/classification_loss": 0.25661149621009827, + "train/contrastive_loss": 1.5218721628189087, + "train/negative_loss": 1.3274472951889038, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 0.1944248378276825, + "train/total_loss": 0.5609859228134155 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.23822341859340668, - "train/contrastive_loss": 4.478044509887695, - "train/negative_loss": 3.905503034591675, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.5725417137145996, - "train/total_loss": 1.133832335472107 + "train/classification_loss": 0.22328856587409973, + "train/contrastive_loss": 4.805528163909912, + "train/negative_loss": 4.8055100440979, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 1.8239355995319784e-05, + "train/total_loss": 1.1843942403793335 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.26300716400146484, - "train/contrastive_loss": 3.551175117492676, - "train/negative_loss": 2.7143514156341553, + "train/classification_loss": 0.23724225163459778, + "train/contrastive_loss": 1.5536742210388184, + "train/negative_loss": 1.1341301202774048, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.8368237614631653, - "train/total_loss": 0.9732422232627869 + "train/positive_loss": 0.4195440411567688, + "train/total_loss": 0.547977089881897 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2259279489517212, - "train/contrastive_loss": 0.7470934391021729, - "train/negative_loss": 0.746955156326294, + "train/classification_loss": 0.2464766800403595, + "train/contrastive_loss": 2.8333542346954346, + "train/negative_loss": 2.789071559906006, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.0001382718182867393, - "train/total_loss": 0.37534666061401367 + "train/num_positives": 8, + "train/positive_loss": 0.044282764196395874, + "train/total_loss": 0.8131475448608398 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.19525264203548431, - "train/contrastive_loss": 2.6279296875, - "train/negative_loss": 1.9456558227539062, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.6822739839553833, - "train/total_loss": 0.7208386063575745 + "train/classification_loss": 0.19211798906326294, + "train/contrastive_loss": 3.807598829269409, + "train/negative_loss": 2.323927402496338, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.4836714267730713, + "train/total_loss": 0.9536377787590027 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.22731608152389526, - "train/contrastive_loss": 1.2634410858154297, - "train/negative_loss": 1.1149497032165527, - "train/num_negatives": 46, + "train/classification_loss": 0.2839981019496918, + "train/contrastive_loss": 2.131500244140625, + "train/negative_loss": 1.8393489122390747, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.14849135279655457, - "train/total_loss": 0.48000431060791016 + "train/positive_loss": 0.29215145111083984, + "train/total_loss": 0.7102981805801392 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.286465048789978, - "train/contrastive_loss": 1.7569940090179443, - "train/negative_loss": 1.7569940090179443, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.6378638744354248 - }, - { - "epoch": 4.182509505703422, - "eval_exact_match_accuracy": 0.14095238095238094, - "eval_hamming_loss": 0.08067226890756303, - "eval_loss": 0.6336852312088013, - "eval_macro_f1": 0.08309941004388503, - "eval_macro_precision": 0.15145652944257848, - "eval_macro_recall": 0.06404947400110854, - "eval_micro_f1": 0.34545454545454546, - "eval_micro_precision": 0.8597285067873304, - "eval_micro_recall": 0.2161547212741752, - "eval_runtime": 2.6342, - "eval_samples_per_second": 199.301, - "eval_steps_per_second": 25.055, + "train/classification_loss": 0.24952849745750427, + "train/contrastive_loss": 1.4020882844924927, + "train/negative_loss": 1.3898981809616089, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.012190134264528751, + "train/total_loss": 0.5299461483955383 + }, + { + "epoch": 3.873239436619718, + "eval_exact_match_accuracy": 0.13580246913580246, + "eval_hamming_loss": 0.08185496420790539, + "eval_loss": 0.7055002450942993, + "eval_macro_f1": 0.0969632603746814, + "eval_macro_precision": 0.2131724484665661, + "eval_macro_recall": 0.07356533001391038, + "eval_micro_f1": 0.31569817866435385, + "eval_micro_precision": 0.8465116279069768, + "eval_micro_recall": 0.19402985074626866, + "eval_runtime": 2.8482, + "eval_samples_per_second": 199.076, + "eval_steps_per_second": 24.928, "step": 1100 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.2238336205482483, - "train/contrastive_loss": 1.7947561740875244, - "train/negative_loss": 1.1132816076278687, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.681474506855011, - "train/total_loss": 0.58278489112854 + "train/classification_loss": 0.2119203507900238, + "train/contrastive_loss": 0.9280003905296326, + "train/negative_loss": 0.8303496241569519, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 0.09765076637268066, + "train/total_loss": 0.39752042293548584 }, { - "epoch": 4.182509505703422, + "epoch": 3.873239436619718, "step": 1100, - "train/classification_loss": 0.22213032841682434, - "train/contrastive_loss": 0.8697492480278015, - "train/negative_loss": 0.8580467104911804, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.011702514253556728, - "train/total_loss": 0.3960801959037781 + "train/classification_loss": 0.20301856100559235, + "train/contrastive_loss": 1.0431458950042725, + "train/negative_loss": 0.81928950548172, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.22385644912719727, + "train/total_loss": 0.4116477370262146 }, { - "epoch": 4.3726235741444865, - "grad_norm": 11.801966667175293, - "learning_rate": 1.9840639269406396e-05, - "loss": 0.9953, + "epoch": 4.049295774647887, + "grad_norm": 13.688472747802734, + "learning_rate": 1.9852572233967583e-05, + "loss": 0.9753, "step": 1150 }, { - "epoch": 4.3726235741444865, + "epoch": 4.049295774647887, "step": 1150, - "train/classification_loss": 0.14190496504306793, - "train/contrastive_loss": 0.7074056267738342, - "train/negative_loss": 0.4608888030052185, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.24651682376861572, - "train/total_loss": 0.28338611125946045 + "train/classification_loss": 0.35411015152931213, + "train/contrastive_loss": 1.787449598312378, + "train/negative_loss": 1.4512560367584229, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 0.33619359135627747, + "train/total_loss": 0.7116000652313232 }, { - "epoch": 4.3726235741444865, + "epoch": 4.049295774647887, "step": 1150, - "train/classification_loss": 0.2316829115152359, - "train/contrastive_loss": 1.4150776863098145, - "train/negative_loss": 0.9924721121788025, + "train/classification_loss": 0.23314321041107178, + "train/contrastive_loss": 0.7754062414169312, + "train/negative_loss": 0.6427779793739319, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.42260557413101196, - "train/total_loss": 0.5146984457969666 + "train/num_positives": 10, + "train/positive_loss": 0.13262827694416046, + "train/total_loss": 0.3882244825363159 }, { - "epoch": 4.562737642585551, - "grad_norm": 14.427437782287598, - "learning_rate": 1.983302891933029e-05, - "loss": 0.9564, + "epoch": 4.225352112676056, + "grad_norm": 20.463239669799805, + "learning_rate": 1.984552501761804e-05, + "loss": 0.9533, "step": 1200 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.26839759945869446, - "train/contrastive_loss": 1.4577640295028687, - "train/negative_loss": 0.4718663692474365, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.9858976602554321, - "train/total_loss": 0.5599504113197327 + "train/classification_loss": 0.23820097744464874, + "train/contrastive_loss": 2.2195143699645996, + "train/negative_loss": 2.1864240169525146, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.033090438693761826, + "train/total_loss": 0.6821038722991943 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.24855321645736694, - "train/contrastive_loss": 2.0087995529174805, - "train/negative_loss": 1.4150294065475464, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.5937700271606445, - "train/total_loss": 0.650313138961792 + "train/classification_loss": 0.3126511871814728, + "train/contrastive_loss": 1.3029661178588867, + "train/negative_loss": 0.6426699757575989, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.6602961421012878, + "train/total_loss": 0.5732444524765015 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.19469839334487915, - "train/contrastive_loss": 2.7767744064331055, - "train/negative_loss": 1.6205757856369019, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.1561986207962036, - "train/total_loss": 0.7500532865524292 + "train/classification_loss": 0.26902809739112854, + "train/contrastive_loss": 3.3653273582458496, + "train/negative_loss": 2.093282461166382, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.2720450162887573, + "train/total_loss": 0.9420936107635498 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.20229922235012054, - "train/contrastive_loss": 2.2982749938964844, - "train/negative_loss": 1.7591887712478638, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.5390862226486206, - "train/total_loss": 0.6619542241096497 + "train/classification_loss": 0.16100594401359558, + "train/contrastive_loss": 1.5097841024398804, + "train/negative_loss": 1.4639619588851929, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.04582216963171959, + "train/total_loss": 0.4629627764225006 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.19738365709781647, - "train/contrastive_loss": 1.5024912357330322, - "train/negative_loss": 1.2989826202392578, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.20350860059261322, - "train/total_loss": 0.4978818893432617 + "train/classification_loss": 0.23391561210155487, + "train/contrastive_loss": 2.871906280517578, + "train/negative_loss": 2.5959837436676025, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.2759224474430084, + "train/total_loss": 0.8082969188690186 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.21106307208538055, - "train/contrastive_loss": 2.1400768756866455, - "train/negative_loss": 1.776803731918335, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.3632732331752777, - "train/total_loss": 0.6390784382820129 + "train/classification_loss": 0.23714615404605865, + "train/contrastive_loss": 2.5147595405578613, + "train/negative_loss": 1.66135573387146, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.8534036874771118, + "train/total_loss": 0.7400980591773987 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.26182296872138977, - "train/contrastive_loss": 1.5999494791030884, - "train/negative_loss": 1.2278475761413574, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.37210190296173096, - "train/total_loss": 0.581812858581543 + "train/classification_loss": 0.22908292710781097, + "train/contrastive_loss": 2.4958722591400146, + "train/negative_loss": 1.5669571161270142, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.9289150834083557, + "train/total_loss": 0.7282573580741882 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.20036856830120087, - "train/contrastive_loss": 2.113412857055664, - "train/negative_loss": 1.77034330368042, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.34306952357292175, - "train/total_loss": 0.6230511665344238 + "train/classification_loss": 0.24315716326236725, + "train/contrastive_loss": 1.147068977355957, + "train/negative_loss": 1.146935224533081, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 0.000133761772303842, + "train/total_loss": 0.4725709557533264 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.1829265058040619, - "train/contrastive_loss": 1.8287562131881714, - "train/negative_loss": 1.7817643880844116, + "train/classification_loss": 0.16732251644134521, + "train/contrastive_loss": 0.6897497773170471, + "train/negative_loss": 0.4277394711971283, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.046991802752017975, - "train/total_loss": 0.5486777424812317 + "train/positive_loss": 0.2620103061199188, + "train/total_loss": 0.3052724599838257 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.3075816333293915, - "train/contrastive_loss": 3.598410129547119, - "train/negative_loss": 1.682419776916504, + "train/classification_loss": 0.25074175000190735, + "train/contrastive_loss": 2.818326711654663, + "train/negative_loss": 1.9771109819412231, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.9159903526306152, - "train/total_loss": 1.0272636413574219 + "train/num_positives": 14, + "train/positive_loss": 0.8412157297134399, + "train/total_loss": 0.8144071102142334 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.21599867939949036, - "train/contrastive_loss": 1.8275816440582275, - "train/negative_loss": 1.6661471128463745, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.16143453121185303, - "train/total_loss": 0.5815150141716003 + "train/classification_loss": 0.20019780099391937, + "train/contrastive_loss": 2.1182432174682617, + "train/negative_loss": 0.9785182476043701, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 1.139724850654602, + "train/total_loss": 0.6238464713096619 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.17099152505397797, - "train/contrastive_loss": 0.9310785531997681, - "train/negative_loss": 0.7932378649711609, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.1378406584262848, - "train/total_loss": 0.3572072386741638 + "train/classification_loss": 0.22391721606254578, + "train/contrastive_loss": 1.2828621864318848, + "train/negative_loss": 1.268310785293579, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.014551392756402493, + "train/total_loss": 0.48048967123031616 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.26226329803466797, - "train/contrastive_loss": 2.7469491958618164, - "train/negative_loss": 1.942963719367981, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.8039854764938354, - "train/total_loss": 0.8116531372070312 + "train/classification_loss": 0.23621715605258942, + "train/contrastive_loss": 3.8077096939086914, + "train/negative_loss": 2.278451681137085, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.529257893562317, + "train/total_loss": 0.9977591037750244 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.17936202883720398, - "train/contrastive_loss": 2.4849205017089844, - "train/negative_loss": 2.4835410118103027, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.0013794123660773039, - "train/total_loss": 0.6763461232185364 + "train/classification_loss": 0.2610945701599121, + "train/contrastive_loss": 1.9956432580947876, + "train/negative_loss": 1.9374083280563354, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.058234892785549164, + "train/total_loss": 0.6602232456207275 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.17135244607925415, - "train/contrastive_loss": 2.0377914905548096, - "train/negative_loss": 1.9605740308761597, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.07721735537052155, - "train/total_loss": 0.5789107084274292 + "train/classification_loss": 0.16263200342655182, + "train/contrastive_loss": 2.7147724628448486, + "train/negative_loss": 0.9403889775276184, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.774383544921875, + "train/total_loss": 0.7055864930152893 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.18525448441505432, - "train/contrastive_loss": 0.8919479846954346, - "train/negative_loss": 0.8295565247535706, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.06239144131541252, - "train/total_loss": 0.3636440634727478 + "train/classification_loss": 0.22432219982147217, + "train/contrastive_loss": 2.260737895965576, + "train/negative_loss": 1.2054569721221924, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 1.0552810430526733, + "train/total_loss": 0.6764698028564453 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.27018457651138306, - "train/contrastive_loss": 2.5182361602783203, - "train/negative_loss": 1.6847496032714844, - "train/num_negatives": 40, + "train/classification_loss": 0.18923906981945038, + "train/contrastive_loss": 1.4630100727081299, + "train/negative_loss": 0.9888707399368286, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.8334864377975464, - "train/total_loss": 0.773831844329834 + "train/positive_loss": 0.47413939237594604, + "train/total_loss": 0.4818410873413086 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.2329711765050888, - "train/contrastive_loss": 1.1303975582122803, - "train/negative_loss": 0.2916741371154785, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.8387234210968018, - "train/total_loss": 0.4590506851673126 + "train/classification_loss": 0.22521206736564636, + "train/contrastive_loss": 2.3338253498077393, + "train/negative_loss": 2.046501636505127, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.28732380270957947, + "train/total_loss": 0.6919771432876587 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.24080206453800201, - "train/contrastive_loss": 1.7278066873550415, - "train/negative_loss": 1.7254767417907715, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.00232996279373765, - "train/total_loss": 0.5863634347915649 + "train/classification_loss": 0.22657722234725952, + "train/contrastive_loss": 1.4559969902038574, + "train/negative_loss": 0.9023036360740662, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.553693413734436, + "train/total_loss": 0.517776608467102 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.1912085860967636, - "train/contrastive_loss": 2.116460084915161, - "train/negative_loss": 1.8914873600006104, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.22497273981571198, - "train/total_loss": 0.6145005822181702 + "train/classification_loss": 0.2026662528514862, + "train/contrastive_loss": 3.5434229373931885, + "train/negative_loss": 2.0275583267211914, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.515864610671997, + "train/total_loss": 0.9113508462905884 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.27608394622802734, - "train/contrastive_loss": 2.8884315490722656, - "train/negative_loss": 1.4030414819717407, - "train/num_negatives": 44, + "train/classification_loss": 0.1881251037120819, + "train/contrastive_loss": 1.39735746383667, + "train/negative_loss": 1.3268437385559082, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.485390067100525, - "train/total_loss": 0.8537702560424805 + "train/positive_loss": 0.07051370292901993, + "train/total_loss": 0.4675965905189514 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.27678975462913513, - "train/contrastive_loss": 1.7279530763626099, - "train/negative_loss": 1.4989614486694336, - "train/num_negatives": 44, + "train/classification_loss": 0.16246214509010315, + "train/contrastive_loss": 2.396956443786621, + "train/negative_loss": 1.8029283285140991, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.22899167239665985, - "train/total_loss": 0.6223803758621216 + "train/positive_loss": 0.594028115272522, + "train/total_loss": 0.6418534517288208 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.16067586839199066, - "train/contrastive_loss": 0.6379473805427551, - "train/negative_loss": 0.458501935005188, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.17944544553756714, - "train/total_loss": 0.2882653474807739 + "train/classification_loss": 0.22203607857227325, + "train/contrastive_loss": 2.9253249168395996, + "train/negative_loss": 1.178288221359253, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 1.7470366954803467, + "train/total_loss": 0.8071010708808899 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.16618803143501282, - "train/contrastive_loss": 0.7172693610191345, - "train/negative_loss": 0.6985741853713989, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.018695151433348656, - "train/total_loss": 0.30964189767837524 + "train/classification_loss": 0.2596926987171173, + "train/contrastive_loss": 2.795374870300293, + "train/negative_loss": 1.4317823648452759, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.3635923862457275, + "train/total_loss": 0.8187676668167114 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.1453627496957779, - "train/contrastive_loss": 1.8768666982650757, - "train/negative_loss": 1.8718293905258179, + "train/classification_loss": 0.21991199254989624, + "train/contrastive_loss": 1.9777274131774902, + "train/negative_loss": 1.2168290615081787, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.005037267226725817, - "train/total_loss": 0.5207360982894897 + "train/num_positives": 10, + "train/positive_loss": 0.7608982920646667, + "train/total_loss": 0.6154574751853943 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.2762885093688965, - "train/contrastive_loss": 1.5779829025268555, - "train/negative_loss": 0.6431745886802673, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 0.9348082542419434, - "train/total_loss": 0.5918850898742676 + "train/classification_loss": 0.2313278615474701, + "train/contrastive_loss": 2.268214702606201, + "train/negative_loss": 1.3194770812988281, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.948737621307373, + "train/total_loss": 0.6849707961082458 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.27747032046318054, - "train/contrastive_loss": 2.4941368103027344, - "train/negative_loss": 1.7425068616867065, + "train/classification_loss": 0.2507913410663605, + "train/contrastive_loss": 2.532198905944824, + "train/negative_loss": 2.511834144592285, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.7516298294067383, - "train/total_loss": 0.7762976884841919 + "train/num_positives": 4, + "train/positive_loss": 0.02036474645137787, + "train/total_loss": 0.7572311162948608 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.22189392149448395, - "train/contrastive_loss": 1.4438281059265137, - "train/negative_loss": 1.406640887260437, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.03718717396259308, - "train/total_loss": 0.5106595754623413 + "train/classification_loss": 0.22977498173713684, + "train/contrastive_loss": 0.4995616674423218, + "train/negative_loss": 0.4863865375518799, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.013175136409699917, + "train/total_loss": 0.32968732714653015 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.2235237956047058, - "train/contrastive_loss": 1.44865083694458, - "train/negative_loss": 0.6642740368843079, - "train/num_negatives": 40, + "train/classification_loss": 0.2593741714954376, + "train/contrastive_loss": 3.8490519523620605, + "train/negative_loss": 2.156369686126709, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.7843768000602722, - "train/total_loss": 0.513253927230835 + "train/positive_loss": 1.692682147026062, + "train/total_loss": 1.0291845798492432 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.23907078802585602, - "train/contrastive_loss": 1.87262761592865, - "train/negative_loss": 1.4635987281799316, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.40902891755104065, - "train/total_loss": 0.6135963201522827 + "train/classification_loss": 0.2559356689453125, + "train/contrastive_loss": 0.7395895719528198, + "train/negative_loss": 0.7330122590065002, + "train/num_negatives": 38, + "train/num_positives": 10, + "train/positive_loss": 0.006577320396900177, + "train/total_loss": 0.4038535952568054 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.19864046573638916, - "train/contrastive_loss": 2.456331729888916, - "train/negative_loss": 1.7687199115753174, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.6876117587089539, - "train/total_loss": 0.6899068355560303 + "train/classification_loss": 0.18498210608959198, + "train/contrastive_loss": 1.246114730834961, + "train/negative_loss": 1.2213551998138428, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.024759579449892044, + "train/total_loss": 0.4342050552368164 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.2457301765680313, - "train/contrastive_loss": 3.40838623046875, - "train/negative_loss": 2.5386738777160645, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.8697124719619751, - "train/total_loss": 0.927407443523407 + "train/classification_loss": 0.21050065755844116, + "train/contrastive_loss": 3.0388805866241455, + "train/negative_loss": 2.182076930999756, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.8568036556243896, + "train/total_loss": 0.8182767629623413 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.2786455750465393, - "train/contrastive_loss": 0.8429851531982422, - "train/negative_loss": 0.8422391414642334, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0007459918851964176, - "train/total_loss": 0.4472426176071167 + "train/classification_loss": 0.21962806582450867, + "train/contrastive_loss": 2.28347110748291, + "train/negative_loss": 1.1052113771438599, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.1782597303390503, + "train/total_loss": 0.6763222813606262 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.24050572514533997, - "train/contrastive_loss": 2.1463565826416016, - "train/negative_loss": 2.122020959854126, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.024335643276572227, - "train/total_loss": 0.6697770357131958 + "train/classification_loss": 0.2414647489786148, + "train/contrastive_loss": 2.0475215911865234, + "train/negative_loss": 1.9549386501312256, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.09258290380239487, + "train/total_loss": 0.6509690880775452 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.22759895026683807, - "train/contrastive_loss": 4.702112674713135, - "train/negative_loss": 2.595444917678833, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 2.1066677570343018, - "train/total_loss": 1.1680214405059814 + "train/classification_loss": 0.26383158564567566, + "train/contrastive_loss": 3.209746837615967, + "train/negative_loss": 1.8684909343719482, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 1.3412559032440186, + "train/total_loss": 0.9057809114456177 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.19805331528186798, - "train/contrastive_loss": 4.068561553955078, - "train/negative_loss": 2.2213776111602783, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.847184181213379, - "train/total_loss": 1.0117655992507935 + "train/classification_loss": 0.16165506839752197, + "train/contrastive_loss": 1.9002012014389038, + "train/negative_loss": 1.8871245384216309, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.013076669536530972, + "train/total_loss": 0.5416953563690186 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.20499426126480103, - "train/contrastive_loss": 2.600393533706665, - "train/negative_loss": 2.1040635108947754, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.49633005261421204, - "train/total_loss": 0.725072979927063 + "train/classification_loss": 0.2387543022632599, + "train/contrastive_loss": 1.91302490234375, + "train/negative_loss": 1.2365256547927856, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 0.6764992475509644, + "train/total_loss": 0.6213592886924744 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.2089759260416031, - "train/contrastive_loss": 1.4349807500839233, - "train/negative_loss": 1.3129751682281494, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.12200554460287094, - "train/total_loss": 0.4959720969200134 + "train/classification_loss": 0.2853037416934967, + "train/contrastive_loss": 3.1011276245117188, + "train/negative_loss": 3.092477560043335, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.00864995177835226, + "train/total_loss": 0.905529260635376 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.2354596108198166, - "train/contrastive_loss": 1.3213410377502441, - "train/negative_loss": 1.3203091621398926, - "train/num_negatives": 46, + "train/classification_loss": 0.22179660201072693, + "train/contrastive_loss": 0.533164381980896, + "train/negative_loss": 0.5205826163291931, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.0125817796215415, + "train/total_loss": 0.3284294903278351 + }, + { + "epoch": 4.225352112676056, + "step": 1200, + "train/classification_loss": 0.27831244468688965, + "train/contrastive_loss": 5.48289680480957, + "train/negative_loss": 3.590162754058838, + "train/num_negatives": 42, "train/num_positives": 8, - "train/positive_loss": 0.0010319247376173735, - "train/total_loss": 0.49972784519195557 + "train/positive_loss": 1.8927342891693115, + "train/total_loss": 1.3748918771743774 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.2204185128211975, - "train/contrastive_loss": 3.387333869934082, - "train/negative_loss": 2.699774980545044, + "train/classification_loss": 0.17007887363433838, + "train/contrastive_loss": 0.6487374305725098, + "train/negative_loss": 0.5470332503318787, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.6875588893890381, - "train/total_loss": 0.8978853225708008 + "train/num_positives": 10, + "train/positive_loss": 0.1017041951417923, + "train/total_loss": 0.29982638359069824 + }, + { + "epoch": 4.225352112676056, + "step": 1200, + "train/classification_loss": 0.20303687453269958, + "train/contrastive_loss": 2.851569652557373, + "train/negative_loss": 1.6394004821777344, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 1.2121692895889282, + "train/total_loss": 0.7733508348464966 + }, + { + "epoch": 4.225352112676056, + "step": 1200, + "train/classification_loss": 0.2422710806131363, + "train/contrastive_loss": 1.0220674276351929, + "train/negative_loss": 1.0196876525878906, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.002379767596721649, + "train/total_loss": 0.4466845691204071 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.20552989840507507, - "train/contrastive_loss": 1.3679394721984863, - "train/negative_loss": 1.2776373624801636, + "train/classification_loss": 0.27504763007164, + "train/contrastive_loss": 1.2418322563171387, + "train/negative_loss": 1.2355135679244995, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.09030213207006454, - "train/total_loss": 0.47911781072616577 + "train/positive_loss": 0.006318744271993637, + "train/total_loss": 0.5234140753746033 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.2059558779001236, - "train/contrastive_loss": 3.013817310333252, - "train/negative_loss": 2.929060220718384, - "train/num_negatives": 36, + "train/classification_loss": 0.2379591315984726, + "train/contrastive_loss": 1.6048810482025146, + "train/negative_loss": 1.3263897895812988, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.2784913182258606, + "train/total_loss": 0.5589353442192078 + }, + { + "epoch": 4.225352112676056, + "step": 1200, + "train/classification_loss": 0.3087451159954071, + "train/contrastive_loss": 3.5816688537597656, + "train/negative_loss": 3.331193447113037, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.08475709706544876, - "train/total_loss": 0.8087193369865417 + "train/positive_loss": 0.25047552585601807, + "train/total_loss": 1.0250788927078247 + }, + { + "epoch": 4.225352112676056, + "step": 1200, + "train/classification_loss": 0.19379587471485138, + "train/contrastive_loss": 1.7554895877838135, + "train/negative_loss": 1.3410553932189941, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.41443419456481934, + "train/total_loss": 0.5448938012123108 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.2514001131057739, - "train/contrastive_loss": 1.1490168571472168, - "train/negative_loss": 1.034923791885376, + "train/classification_loss": 0.2315230667591095, + "train/contrastive_loss": 2.369478225708008, + "train/negative_loss": 1.7959967851638794, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.1140931248664856, - "train/total_loss": 0.48120349645614624 + "train/num_positives": 14, + "train/positive_loss": 0.573481559753418, + "train/total_loss": 0.7054187059402466 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.20319001376628876, - "train/contrastive_loss": 2.28110933303833, - "train/negative_loss": 1.6794915199279785, + "train/classification_loss": 0.2758389115333557, + "train/contrastive_loss": 2.6423323154449463, + "train/negative_loss": 2.6422619819641113, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.6016177535057068, - "train/total_loss": 0.6594119071960449 + "train/num_positives": 2, + "train/positive_loss": 7.033595466054976e-05, + "train/total_loss": 0.804305374622345 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.17435213923454285, - "train/contrastive_loss": 1.4656281471252441, - "train/negative_loss": 0.9639892578125, + "train/classification_loss": 0.21867045760154724, + "train/contrastive_loss": 2.055758237838745, + "train/negative_loss": 1.3003343343734741, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.5016388893127441, - "train/total_loss": 0.4674777686595917 + "train/num_positives": 16, + "train/positive_loss": 0.755423903465271, + "train/total_loss": 0.6298221349716187 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.29912638664245605, - "train/contrastive_loss": 1.6367400884628296, - "train/negative_loss": 1.4498403072357178, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.18689975142478943, - "train/total_loss": 0.6264743804931641 + "train/classification_loss": 0.21739840507507324, + "train/contrastive_loss": 1.3960161209106445, + "train/negative_loss": 1.1293599605560303, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.26665621995925903, + "train/total_loss": 0.4966016411781311 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.163253515958786, - "train/contrastive_loss": 1.985257863998413, - "train/negative_loss": 1.9852070808410645, - "train/num_negatives": 48, + "train/classification_loss": 0.24844343960285187, + "train/contrastive_loss": 0.8801074028015137, + "train/negative_loss": 0.4586319029331207, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 5.07555014337413e-05, - "train/total_loss": 0.560305118560791 + "train/positive_loss": 0.42147552967071533, + "train/total_loss": 0.4244649410247803 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.18570803105831146, - "train/contrastive_loss": 0.12421001493930817, - "train/negative_loss": 0.12394455820322037, + "train/classification_loss": 0.23639611899852753, + "train/contrastive_loss": 1.2823047637939453, + "train/negative_loss": 0.7736068367958069, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.0002654590643942356, - "train/total_loss": 0.21055004000663757 + "train/num_positives": 14, + "train/positive_loss": 0.5086979269981384, + "train/total_loss": 0.49285709857940674 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.1604071706533432, - "train/contrastive_loss": 0.5751709938049316, - "train/negative_loss": 0.5742742419242859, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.0008967560715973377, - "train/total_loss": 0.27544137835502625 + "train/classification_loss": 0.31819280982017517, + "train/contrastive_loss": 2.318375825881958, + "train/negative_loss": 1.9652572870254517, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 0.3531185984611511, + "train/total_loss": 0.7818679809570312 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.24296583235263824, - "train/contrastive_loss": 0.6734508275985718, - "train/negative_loss": 0.6157106757164001, - "train/num_negatives": 28, + "train/classification_loss": 0.1730251908302307, + "train/contrastive_loss": 1.403673768043518, + "train/negative_loss": 1.2460966110229492, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.05774018168449402, - "train/total_loss": 0.3776559829711914 + "train/positive_loss": 0.15757720172405243, + "train/total_loss": 0.45375993847846985 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.22031164169311523, - "train/contrastive_loss": 2.112429141998291, - "train/negative_loss": 1.455772042274475, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.6566569805145264, - "train/total_loss": 0.6427974700927734 + "train/classification_loss": 0.1673741340637207, + "train/contrastive_loss": 1.0294147729873657, + "train/negative_loss": 0.5770444273948669, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.4523703157901764, + "train/total_loss": 0.3732571005821228 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.19519221782684326, - "train/contrastive_loss": 1.166387677192688, - "train/negative_loss": 1.1660339832305908, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.0003536841832101345, - "train/total_loss": 0.42846977710723877 + "train/classification_loss": 0.2136966735124588, + "train/contrastive_loss": 3.459001302719116, + "train/negative_loss": 1.811866283416748, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.6471350193023682, + "train/total_loss": 0.9054969549179077 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.2163453996181488, - "train/contrastive_loss": 1.816586971282959, - "train/negative_loss": 0.9901488423347473, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.8264381289482117, - "train/total_loss": 0.5796627998352051 + "train/classification_loss": 0.230219304561615, + "train/contrastive_loss": 2.9058241844177246, + "train/negative_loss": 1.434438705444336, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.4713853597640991, + "train/total_loss": 0.8113841414451599 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.2443111389875412, - "train/contrastive_loss": 1.9039762020111084, - "train/negative_loss": 1.519092321395874, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.38488394021987915, - "train/total_loss": 0.6251063942909241 + "train/classification_loss": 0.24400371313095093, + "train/contrastive_loss": 1.9538731575012207, + "train/negative_loss": 1.9181960821151733, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.03567707538604736, + "train/total_loss": 0.6347783803939819 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.2105715274810791, - "train/contrastive_loss": 0.865288257598877, - "train/negative_loss": 0.6259064078330994, + "train/classification_loss": 0.180061936378479, + "train/contrastive_loss": 0.370182603597641, + "train/negative_loss": 0.34648385643959045, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.2393818348646164, - "train/total_loss": 0.3836292028427124 + "train/num_positives": 16, + "train/positive_loss": 0.02369873598217964, + "train/total_loss": 0.25409847497940063 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.19144181907176971, - "train/contrastive_loss": 3.1919474601745605, - "train/negative_loss": 2.3381521701812744, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.8537951707839966, - "train/total_loss": 0.8298313617706299 + "train/classification_loss": 0.21889282763004303, + "train/contrastive_loss": 2.6643178462982178, + "train/negative_loss": 1.7027565240859985, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 0.961561381816864, + "train/total_loss": 0.7517563700675964 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.25484737753868103, - "train/contrastive_loss": 2.382009267807007, - "train/negative_loss": 1.7951282262802124, + "train/classification_loss": 0.2903638184070587, + "train/contrastive_loss": 2.4090704917907715, + "train/negative_loss": 1.8289307355880737, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.5868809819221497, - "train/total_loss": 0.731249213218689 + "train/num_positives": 2, + "train/positive_loss": 0.5801397562026978, + "train/total_loss": 0.7721779346466064 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.2358301728963852, - "train/contrastive_loss": 2.4589428901672363, - "train/negative_loss": 2.331228733062744, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.12771406769752502, - "train/total_loss": 0.7276187539100647 + "train/classification_loss": 0.17654463648796082, + "train/contrastive_loss": 2.6437220573425293, + "train/negative_loss": 1.5578287839889526, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.0858933925628662, + "train/total_loss": 0.7052890062332153 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.1986648589372635, - "train/contrastive_loss": 2.04693603515625, - "train/negative_loss": 1.6210026741027832, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.4259333312511444, - "train/total_loss": 0.6080520749092102 + "train/classification_loss": 0.2135140597820282, + "train/contrastive_loss": 1.1043596267700195, + "train/negative_loss": 0.9168818593025208, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.18747779726982117, + "train/total_loss": 0.4343859851360321 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.21180230379104614, - "train/contrastive_loss": 2.63047194480896, - "train/negative_loss": 1.6385458707809448, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.9919260144233704, - "train/total_loss": 0.7378966808319092 + "train/classification_loss": 0.23641914129257202, + "train/contrastive_loss": 1.5262194871902466, + "train/negative_loss": 0.9449999928474426, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 0.581219494342804, + "train/total_loss": 0.5416630506515503 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.23444046080112457, - "train/contrastive_loss": 5.022212982177734, - "train/negative_loss": 4.493795871734619, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.5284169316291809, - "train/total_loss": 1.2388830184936523 + "train/classification_loss": 0.21804450452327728, + "train/contrastive_loss": 4.433368682861328, + "train/negative_loss": 4.43336296081543, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 5.877047897229204e-06, + "train/total_loss": 1.1047182083129883 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.25333359837532043, - "train/contrastive_loss": 3.979893445968628, - "train/negative_loss": 3.4290618896484375, + "train/classification_loss": 0.22903616726398468, + "train/contrastive_loss": 1.26973557472229, + "train/negative_loss": 1.2510457038879395, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.5508314967155457, - "train/total_loss": 1.0493123531341553 + "train/positive_loss": 0.018689824268221855, + "train/total_loss": 0.4829832911491394 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.21516290307044983, - "train/contrastive_loss": 0.7093483209609985, - "train/negative_loss": 0.7079390287399292, + "train/classification_loss": 0.2400054931640625, + "train/contrastive_loss": 2.513589382171631, + "train/negative_loss": 1.3694665431976318, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.0014092717319726944, - "train/total_loss": 0.35703256726264954 + "train/num_positives": 8, + "train/positive_loss": 1.144122838973999, + "train/total_loss": 0.7427234053611755 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.1886620819568634, - "train/contrastive_loss": 1.7270159721374512, - "train/negative_loss": 1.6095311641693115, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.11748479306697845, - "train/total_loss": 0.5340652465820312 + "train/classification_loss": 0.18603594601154327, + "train/contrastive_loss": 2.5822553634643555, + "train/negative_loss": 1.6960792541503906, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.8861759901046753, + "train/total_loss": 0.7024869918823242 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.21739286184310913, - "train/contrastive_loss": 1.3591803312301636, - "train/negative_loss": 1.1185948848724365, - "train/num_negatives": 46, + "train/classification_loss": 0.26890575885772705, + "train/contrastive_loss": 2.616194725036621, + "train/negative_loss": 2.1009938716888428, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.24058547616004944, - "train/total_loss": 0.4892289340496063 + "train/positive_loss": 0.5152009725570679, + "train/total_loss": 0.7921447157859802 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.27971896529197693, - "train/contrastive_loss": 1.824594259262085, - "train/negative_loss": 1.824594259262085, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.6446378231048584 - }, - { - "epoch": 4.562737642585551, - "eval_exact_match_accuracy": 0.2057142857142857, - "eval_hamming_loss": 0.07607843137254902, - "eval_loss": 0.6215377449989319, - "eval_macro_f1": 0.11087585082610912, - "eval_macro_precision": 0.14558756185216046, - "eval_macro_recall": 0.09297645877119683, - "eval_micro_f1": 0.4260355029585799, - "eval_micro_precision": 0.8289473684210527, - "eval_micro_recall": 0.28668941979522183, - "eval_runtime": 2.6333, - "eval_samples_per_second": 199.372, - "eval_steps_per_second": 25.064, + "train/classification_loss": 0.2412821352481842, + "train/contrastive_loss": 1.127841830253601, + "train/negative_loss": 0.8097090721130371, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.3181327283382416, + "train/total_loss": 0.46685051918029785 + }, + { + "epoch": 4.225352112676056, + "eval_exact_match_accuracy": 0.18342151675485008, + "eval_hamming_loss": 0.07666770411868451, + "eval_loss": 0.655646026134491, + "eval_macro_f1": 0.1646030455442915, + "eval_macro_precision": 0.2693936266691685, + "eval_macro_recall": 0.12418034188159713, + "eval_micro_f1": 0.38365304420350294, + "eval_micro_precision": 0.8812260536398467, + "eval_micro_recall": 0.24520255863539445, + "eval_runtime": 2.8396, + "eval_samples_per_second": 199.678, + "eval_steps_per_second": 25.004, "step": 1200 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.1630367636680603, - "train/contrastive_loss": 0.8318741917610168, - "train/negative_loss": 0.7226485013961792, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.10922569781541824, - "train/total_loss": 0.3294116258621216 + "train/classification_loss": 0.23825527727603912, + "train/contrastive_loss": 2.3279671669006348, + "train/negative_loss": 1.4855165481567383, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.8424504995346069, + "train/total_loss": 0.7038487195968628 }, { - "epoch": 4.562737642585551, + "epoch": 4.225352112676056, "step": 1200, - "train/classification_loss": 0.2371024489402771, - "train/contrastive_loss": 1.2116382122039795, - "train/negative_loss": 0.937936544418335, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 0.27370160818099976, - "train/total_loss": 0.47943007946014404 + "train/classification_loss": 0.1869194060564041, + "train/contrastive_loss": 2.0423145294189453, + "train/negative_loss": 1.075447916984558, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.9668665528297424, + "train/total_loss": 0.5953823328018188 }, { - "epoch": 4.752851711026616, - "grad_norm": 17.564401626586914, - "learning_rate": 1.9825418569254185e-05, - "loss": 0.9046, + "epoch": 4.401408450704225, + "grad_norm": 14.286855697631836, + "learning_rate": 1.98384778012685e-05, + "loss": 0.9638, "step": 1250 }, { - "epoch": 4.752851711026616, + "epoch": 4.401408450704225, "step": 1250, - "train/classification_loss": 0.1692526787519455, - "train/contrastive_loss": 2.044642210006714, - "train/negative_loss": 1.8815244436264038, - "train/num_negatives": 24, - "train/num_positives": 32, - "train/positive_loss": 0.16311787068843842, - "train/total_loss": 0.5781811475753784 + "train/classification_loss": 0.19104373455047607, + "train/contrastive_loss": 0.6243109703063965, + "train/negative_loss": 0.6222519278526306, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.0020590173080563545, + "train/total_loss": 0.31590592861175537 }, { - "epoch": 4.752851711026616, + "epoch": 4.401408450704225, "step": 1250, - "train/classification_loss": 0.17984116077423096, - "train/contrastive_loss": 0.523725152015686, - "train/negative_loss": 0.3216233551502228, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.20210178196430206, - "train/total_loss": 0.28458619117736816 + "train/classification_loss": 0.20892855525016785, + "train/contrastive_loss": 0.9095954895019531, + "train/negative_loss": 0.4751937687397003, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.4344017505645752, + "train/total_loss": 0.39084765315055847 }, { - "epoch": 4.942965779467681, - "grad_norm": 13.826289176940918, - "learning_rate": 1.9817808219178083e-05, - "loss": 0.9356, + "epoch": 4.577464788732394, + "grad_norm": 14.127750396728516, + "learning_rate": 1.9831430584918957e-05, + "loss": 0.9747, "step": 1300 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.2672991156578064, - "train/contrastive_loss": 1.0850895643234253, - "train/negative_loss": 0.34369030594825745, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.7413992285728455, - "train/total_loss": 0.48431703448295593 + "train/classification_loss": 0.23401476442813873, + "train/contrastive_loss": 1.5566043853759766, + "train/negative_loss": 1.1262366771697998, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.43036770820617676, + "train/total_loss": 0.5453356504440308 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.24539868533611298, - "train/contrastive_loss": 2.482184886932373, - "train/negative_loss": 1.5057786703109741, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.9764063358306885, - "train/total_loss": 0.7418356537818909 + "train/classification_loss": 0.3032030761241913, + "train/contrastive_loss": 0.8808788657188416, + "train/negative_loss": 0.7914912700653076, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.08938758075237274, + "train/total_loss": 0.4793788492679596 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.19496262073516846, - "train/contrastive_loss": 3.4088973999023438, - "train/negative_loss": 1.6322332620620728, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.776664137840271, - "train/total_loss": 0.8767421245574951 + "train/classification_loss": 0.2706410884857178, + "train/contrastive_loss": 3.123760938644409, + "train/negative_loss": 1.550243854522705, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.573517084121704, + "train/total_loss": 0.8953933119773865 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.18774834275245667, - "train/contrastive_loss": 2.0869650840759277, - "train/negative_loss": 1.3300217390060425, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.7569432854652405, - "train/total_loss": 0.6051414012908936 + "train/classification_loss": 0.15798883140087128, + "train/contrastive_loss": 1.3137962818145752, + "train/negative_loss": 0.822451114654541, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.49134519696235657, + "train/total_loss": 0.42074811458587646 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.19059738516807556, - "train/contrastive_loss": 1.097536563873291, - "train/negative_loss": 0.8176900744438171, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.27984654903411865, - "train/total_loss": 0.4101046919822693 + "train/classification_loss": 0.22797857224941254, + "train/contrastive_loss": 2.997321128845215, + "train/negative_loss": 2.844057083129883, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.15326400101184845, + "train/total_loss": 0.8274428248405457 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.20362304151058197, - "train/contrastive_loss": 2.4351911544799805, - "train/negative_loss": 1.4775639772415161, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.9576271772384644, - "train/total_loss": 0.6906612515449524 + "train/classification_loss": 0.2316315919160843, + "train/contrastive_loss": 2.246314525604248, + "train/negative_loss": 1.2781991958618164, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.9681152701377869, + "train/total_loss": 0.6808944940567017 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.2527095079421997, - "train/contrastive_loss": 1.442384958267212, - "train/negative_loss": 0.935674786567688, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.5067101120948792, - "train/total_loss": 0.541186511516571 + "train/classification_loss": 0.23319797217845917, + "train/contrastive_loss": 1.6386709213256836, + "train/negative_loss": 1.2055596113204956, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.4331112802028656, + "train/total_loss": 0.5609321594238281 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.18543018400669098, - "train/contrastive_loss": 1.339931607246399, - "train/negative_loss": 1.2386866807937622, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.1012449562549591, - "train/total_loss": 0.45341652631759644 + "train/classification_loss": 0.23404213786125183, + "train/contrastive_loss": 1.2143553495407104, + "train/negative_loss": 1.2142421007156372, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 0.00011325523519190028, + "train/total_loss": 0.4769132137298584 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.1738726645708084, - "train/contrastive_loss": 1.6066359281539917, - "train/negative_loss": 1.5583361387252808, + "train/classification_loss": 0.15626783668994904, + "train/contrastive_loss": 0.5440346002578735, + "train/negative_loss": 0.45632341504096985, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.04829978197813034, - "train/total_loss": 0.49519985914230347 + "train/positive_loss": 0.08771121501922607, + "train/total_loss": 0.265074759721756 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.2981390953063965, - "train/contrastive_loss": 3.308047294616699, - "train/negative_loss": 1.6840907335281372, + "train/classification_loss": 0.25827547907829285, + "train/contrastive_loss": 3.0953986644744873, + "train/negative_loss": 2.4372997283935547, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.6239564418792725, - "train/total_loss": 0.9597485661506653 + "train/num_positives": 14, + "train/positive_loss": 0.6580989360809326, + "train/total_loss": 0.8773552179336548 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.21321016550064087, - "train/contrastive_loss": 1.9054371118545532, - "train/negative_loss": 1.4665374755859375, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.4388996362686157, - "train/total_loss": 0.5942975878715515 + "train/classification_loss": 0.19195662438869476, + "train/contrastive_loss": 1.2604176998138428, + "train/negative_loss": 0.9611589312553406, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.2992587685585022, + "train/total_loss": 0.4440401792526245 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.1589135080575943, - "train/contrastive_loss": 1.47275972366333, - "train/negative_loss": 0.82538902759552, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.6473707556724548, - "train/total_loss": 0.45346546173095703 + "train/classification_loss": 0.21832390129566193, + "train/contrastive_loss": 2.0778255462646484, + "train/negative_loss": 1.519291639328003, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.5585338473320007, + "train/total_loss": 0.6338890194892883 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.2476869821548462, - "train/contrastive_loss": 4.100563049316406, - "train/negative_loss": 1.980346918106079, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 2.1202163696289062, - "train/total_loss": 1.0677995681762695 + "train/classification_loss": 0.23998992145061493, + "train/contrastive_loss": 3.333832263946533, + "train/negative_loss": 1.804917335510254, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.5289148092269897, + "train/total_loss": 0.9067564010620117 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.173760786652565, - "train/contrastive_loss": 2.278841495513916, - "train/negative_loss": 2.2711021900177, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.007739389315247536, - "train/total_loss": 0.6295291185379028 + "train/classification_loss": 0.2453434020280838, + "train/contrastive_loss": 1.5505229234695435, + "train/negative_loss": 1.1107038259506226, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.4398190975189209, + "train/total_loss": 0.5554479956626892 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.1619970202445984, - "train/contrastive_loss": 1.5546411275863647, - "train/negative_loss": 1.4141292572021484, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.14051185548305511, - "train/total_loss": 0.47292524576187134 + "train/classification_loss": 0.1536543369293213, + "train/contrastive_loss": 1.608515977859497, + "train/negative_loss": 0.882408618927002, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.7261072993278503, + "train/total_loss": 0.4753575325012207 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.17155300080776215, - "train/contrastive_loss": 0.7726371884346008, - "train/negative_loss": 0.5517229437828064, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.22091424465179443, - "train/total_loss": 0.32608044147491455 + "train/classification_loss": 0.2283710390329361, + "train/contrastive_loss": 1.872093677520752, + "train/negative_loss": 1.0226361751556396, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.8494575023651123, + "train/total_loss": 0.6027897596359253 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.2567421495914459, - "train/contrastive_loss": 2.508636713027954, - "train/negative_loss": 1.566206932067871, - "train/num_negatives": 40, + "train/classification_loss": 0.1807592660188675, + "train/contrastive_loss": 1.440096378326416, + "train/negative_loss": 0.8546149134635925, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.9424297213554382, - "train/total_loss": 0.7584694623947144 + "train/positive_loss": 0.5854814052581787, + "train/total_loss": 0.4687785506248474 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.2374272644519806, - "train/contrastive_loss": 0.8635271787643433, - "train/negative_loss": 0.32061833143234253, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.5429088473320007, - "train/total_loss": 0.4101327061653137 + "train/classification_loss": 0.23544827103614807, + "train/contrastive_loss": 3.3001837730407715, + "train/negative_loss": 2.247168779373169, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 1.0530149936676025, + "train/total_loss": 0.8954850435256958 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.2248895913362503, - "train/contrastive_loss": 1.0827058553695679, - "train/negative_loss": 1.0588452816009521, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.023860570043325424, - "train/total_loss": 0.4414307475090027 + "train/classification_loss": 0.2252124696969986, + "train/contrastive_loss": 1.0233691930770874, + "train/negative_loss": 0.8507015705108643, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.17266766726970673, + "train/total_loss": 0.4298863112926483 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.18709808588027954, - "train/contrastive_loss": 2.070908546447754, - "train/negative_loss": 1.5052635669708252, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.5656448602676392, - "train/total_loss": 0.6012797951698303 + "train/classification_loss": 0.19599266350269318, + "train/contrastive_loss": 2.6318631172180176, + "train/negative_loss": 1.7453365325927734, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.8865267038345337, + "train/total_loss": 0.7223652601242065 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.2616986036300659, - "train/contrastive_loss": 2.1968815326690674, - "train/negative_loss": 0.8816778063774109, - "train/num_negatives": 44, + "train/classification_loss": 0.1796572357416153, + "train/contrastive_loss": 2.135979652404785, + "train/negative_loss": 2.044992685317993, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.3152036666870117, - "train/total_loss": 0.7010749578475952 + "train/positive_loss": 0.09098690003156662, + "train/total_loss": 0.606853187084198 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.27821773290634155, - "train/contrastive_loss": 2.377044439315796, - "train/negative_loss": 1.6032603979110718, - "train/num_negatives": 44, + "train/classification_loss": 0.15876658260822296, + "train/contrastive_loss": 2.268186092376709, + "train/negative_loss": 1.7233991622924805, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.7737840414047241, - "train/total_loss": 0.7536265850067139 + "train/positive_loss": 0.5447870492935181, + "train/total_loss": 0.6124038100242615 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.15747423470020294, - "train/contrastive_loss": 0.860465943813324, - "train/negative_loss": 0.39857813715934753, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.46188780665397644, - "train/total_loss": 0.32956743240356445 + "train/classification_loss": 0.22039884328842163, + "train/contrastive_loss": 3.5753307342529297, + "train/negative_loss": 1.9010919332504272, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 1.674238681793213, + "train/total_loss": 0.9354649782180786 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.15912030637264252, - "train/contrastive_loss": 0.657329797744751, - "train/negative_loss": 0.23808647692203522, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.41924330592155457, - "train/total_loss": 0.2905862629413605 + "train/classification_loss": 0.26601025462150574, + "train/contrastive_loss": 3.0995233058929443, + "train/negative_loss": 1.4762790203094482, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.623244285583496, + "train/total_loss": 0.8859149217605591 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.14338319003582, - "train/contrastive_loss": 1.1259347200393677, - "train/negative_loss": 0.9489412903785706, + "train/classification_loss": 0.20932075381278992, + "train/contrastive_loss": 1.5616726875305176, + "train/negative_loss": 0.7338090538978577, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.1769934743642807, - "train/total_loss": 0.36857014894485474 + "train/num_positives": 10, + "train/positive_loss": 0.8278636932373047, + "train/total_loss": 0.5216553211212158 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.27535226941108704, - "train/contrastive_loss": 1.8809404373168945, - "train/negative_loss": 0.5833396315574646, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.2976008653640747, - "train/total_loss": 0.6515403985977173 + "train/classification_loss": 0.22062526643276215, + "train/contrastive_loss": 3.1800804138183594, + "train/negative_loss": 1.8454644680023193, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.3346158266067505, + "train/total_loss": 0.8566413521766663 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.2630498707294464, - "train/contrastive_loss": 2.444380760192871, - "train/negative_loss": 1.8038442134857178, + "train/classification_loss": 0.24183550477027893, + "train/contrastive_loss": 1.7665767669677734, + "train/negative_loss": 1.6985372304916382, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.6405364274978638, - "train/total_loss": 0.751926064491272 + "train/num_positives": 4, + "train/positive_loss": 0.06803955137729645, + "train/total_loss": 0.5951508283615112 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.2188803106546402, - "train/contrastive_loss": 2.1948680877685547, - "train/negative_loss": 1.6409235000610352, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.5539445877075195, - "train/total_loss": 0.6578539609909058 + "train/classification_loss": 0.22191646695137024, + "train/contrastive_loss": 0.7853184342384338, + "train/negative_loss": 0.7448700666427612, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.04044835641980171, + "train/total_loss": 0.3789801597595215 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.21479985117912292, - "train/contrastive_loss": 1.168379306793213, - "train/negative_loss": 0.5759677886962891, - "train/num_negatives": 40, + "train/classification_loss": 0.2545104920864105, + "train/contrastive_loss": 2.4410057067871094, + "train/negative_loss": 1.145552158355713, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.592411458492279, - "train/total_loss": 0.44847571849823 + "train/positive_loss": 1.295453667640686, + "train/total_loss": 0.7427116632461548 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.2356666475534439, - "train/contrastive_loss": 2.4238123893737793, - "train/negative_loss": 2.1562650203704834, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.2675473690032959, - "train/total_loss": 0.7204291224479675 + "train/classification_loss": 0.253305584192276, + "train/contrastive_loss": 0.8166927099227905, + "train/negative_loss": 0.811310887336731, + "train/num_negatives": 38, + "train/num_positives": 10, + "train/positive_loss": 0.005381798837333918, + "train/total_loss": 0.4166441261768341 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.19284938275814056, - "train/contrastive_loss": 2.1719746589660645, - "train/negative_loss": 1.3377281427383423, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.8342463970184326, - "train/total_loss": 0.6272442936897278 + "train/classification_loss": 0.1783934235572815, + "train/contrastive_loss": 1.362443447113037, + "train/negative_loss": 1.3614118099212646, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.0010316881816834211, + "train/total_loss": 0.45088210701942444 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.24648195505142212, - "train/contrastive_loss": 3.492413282394409, - "train/negative_loss": 1.821589469909668, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.6708238124847412, - "train/total_loss": 0.9449646472930908 + "train/classification_loss": 0.2097310572862625, + "train/contrastive_loss": 2.6462390422821045, + "train/negative_loss": 1.9738372564315796, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.6724017858505249, + "train/total_loss": 0.7389788627624512 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.2603757679462433, - "train/contrastive_loss": 0.9191632270812988, - "train/negative_loss": 0.9188969135284424, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0002662893966771662, - "train/total_loss": 0.44420841336250305 + "train/classification_loss": 0.21386770904064178, + "train/contrastive_loss": 1.8183174133300781, + "train/negative_loss": 1.460629940032959, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.3576875329017639, + "train/total_loss": 0.5775312185287476 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.23031623661518097, - "train/contrastive_loss": 1.5984346866607666, - "train/negative_loss": 1.3428459167480469, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.2555887699127197, - "train/total_loss": 0.550003170967102 + "train/classification_loss": 0.2335360199213028, + "train/contrastive_loss": 1.8065866231918335, + "train/negative_loss": 1.7047090530395508, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.10187755525112152, + "train/total_loss": 0.5948533415794373 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.22189201414585114, - "train/contrastive_loss": 4.308663368225098, - "train/negative_loss": 2.3792483806610107, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.9294147491455078, - "train/total_loss": 1.0836247205734253 + "train/classification_loss": 0.2644630968570709, + "train/contrastive_loss": 3.0111443996429443, + "train/negative_loss": 1.7868986129760742, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 1.2242457866668701, + "train/total_loss": 0.8666919469833374 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.18818381428718567, - "train/contrastive_loss": 4.359396934509277, - "train/negative_loss": 1.6290926933288574, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 2.730304479598999, - "train/total_loss": 1.0600632429122925 + "train/classification_loss": 0.15774653851985931, + "train/contrastive_loss": 1.5923125743865967, + "train/negative_loss": 1.5920966863632202, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.00021586695220321417, + "train/total_loss": 0.47620904445648193 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.18919169902801514, - "train/contrastive_loss": 1.9583799839019775, - "train/negative_loss": 1.3191421031951904, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.6392378807067871, - "train/total_loss": 0.5808677077293396 + "train/classification_loss": 0.22504517436027527, + "train/contrastive_loss": 1.5546013116836548, + "train/negative_loss": 1.1543443202972412, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 0.40025702118873596, + "train/total_loss": 0.5359654426574707 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.20685182511806488, - "train/contrastive_loss": 1.463133692741394, - "train/negative_loss": 1.356419563293457, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.1067141517996788, - "train/total_loss": 0.4994785785675049 + "train/classification_loss": 0.2818101644515991, + "train/contrastive_loss": 2.370673894882202, + "train/negative_loss": 2.32077956199646, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.049894239753484726, + "train/total_loss": 0.7559449672698975 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.22733446955680847, - "train/contrastive_loss": 1.4116374254226685, - "train/negative_loss": 1.3446300029754639, - "train/num_negatives": 46, + "train/classification_loss": 0.21561689674854279, + "train/contrastive_loss": 0.12947344779968262, + "train/negative_loss": 0.12818895280361176, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.0012845013989135623, + "train/total_loss": 0.24151158332824707 + }, + { + "epoch": 4.577464788732394, + "step": 1300, + "train/classification_loss": 0.2862207293510437, + "train/contrastive_loss": 4.021243095397949, + "train/negative_loss": 2.4355289936065674, + "train/num_negatives": 42, "train/num_positives": 8, - "train/positive_loss": 0.06700743734836578, - "train/total_loss": 0.5096619725227356 + "train/positive_loss": 1.5857142210006714, + "train/total_loss": 1.0904693603515625 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.21124614775180817, - "train/contrastive_loss": 2.009889602661133, - "train/negative_loss": 2.0027387142181396, + "train/classification_loss": 0.1605284959077835, + "train/contrastive_loss": 0.9733806848526001, + "train/negative_loss": 0.7981491088867188, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.007150884252041578, - "train/total_loss": 0.6132240891456604 + "train/num_positives": 10, + "train/positive_loss": 0.17523156106472015, + "train/total_loss": 0.35520464181900024 + }, + { + "epoch": 4.577464788732394, + "step": 1300, + "train/classification_loss": 0.2003738433122635, + "train/contrastive_loss": 2.7260022163391113, + "train/negative_loss": 1.368889570236206, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 1.3571126461029053, + "train/total_loss": 0.7455742955207825 + }, + { + "epoch": 4.577464788732394, + "step": 1300, + "train/classification_loss": 0.23827454447746277, + "train/contrastive_loss": 0.8021093010902405, + "train/negative_loss": 0.8008567690849304, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.0012525434140115976, + "train/total_loss": 0.3986964225769043 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.19748689234256744, - "train/contrastive_loss": 1.061777114868164, - "train/negative_loss": 1.0559797286987305, + "train/classification_loss": 0.26579779386520386, + "train/contrastive_loss": 1.3488194942474365, + "train/negative_loss": 1.3370717763900757, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.005797424353659153, - "train/total_loss": 0.409842312335968 + "train/positive_loss": 0.011747724376618862, + "train/total_loss": 0.5355616807937622 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.20753462612628937, - "train/contrastive_loss": 1.947122573852539, - "train/negative_loss": 1.4035279750823975, - "train/num_negatives": 36, + "train/classification_loss": 0.2275983840227127, + "train/contrastive_loss": 1.4242030382156372, + "train/negative_loss": 1.3714383840560913, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.052764710038900375, + "train/total_loss": 0.5124390125274658 + }, + { + "epoch": 4.577464788732394, + "step": 1300, + "train/classification_loss": 0.3079846203327179, + "train/contrastive_loss": 3.3644702434539795, + "train/negative_loss": 2.594789743423462, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.5435946583747864, - "train/total_loss": 0.5969591736793518 + "train/positive_loss": 0.7696805000305176, + "train/total_loss": 0.9808787107467651 + }, + { + "epoch": 4.577464788732394, + "step": 1300, + "train/classification_loss": 0.1919877976179123, + "train/contrastive_loss": 2.4588255882263184, + "train/negative_loss": 1.198575496673584, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.2602500915527344, + "train/total_loss": 0.6837528944015503 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.24824367463588715, - "train/contrastive_loss": 0.7680497169494629, - "train/negative_loss": 0.5885024070739746, + "train/classification_loss": 0.22943200170993805, + "train/contrastive_loss": 2.4177746772766113, + "train/negative_loss": 1.6359587907791138, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.17954730987548828, - "train/total_loss": 0.40185362100601196 + "train/num_positives": 14, + "train/positive_loss": 0.7818158268928528, + "train/total_loss": 0.712986946105957 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.20164887607097626, - "train/contrastive_loss": 2.727020263671875, - "train/negative_loss": 1.7220109701156616, + "train/classification_loss": 0.27851197123527527, + "train/contrastive_loss": 2.978896141052246, + "train/negative_loss": 2.9785914421081543, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.0050091743469238, - "train/total_loss": 0.7470529675483704 + "train/num_positives": 2, + "train/positive_loss": 0.00030462612630799413, + "train/total_loss": 0.874291181564331 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.16581986844539642, - "train/contrastive_loss": 1.6796553134918213, - "train/negative_loss": 0.730075478553772, + "train/classification_loss": 0.2117909938097, + "train/contrastive_loss": 1.9047844409942627, + "train/negative_loss": 1.1458433866500854, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.9495798349380493, - "train/total_loss": 0.5017509460449219 + "train/num_positives": 16, + "train/positive_loss": 0.7589410543441772, + "train/total_loss": 0.5927478671073914 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.29705914855003357, - "train/contrastive_loss": 1.175432801246643, - "train/negative_loss": 1.0693796873092651, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.10605311393737793, - "train/total_loss": 0.5321457386016846 + "train/classification_loss": 0.2072007805109024, + "train/contrastive_loss": 0.7204608917236328, + "train/negative_loss": 0.685080349445343, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.035380519926548004, + "train/total_loss": 0.3512929677963257 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.15533043444156647, - "train/contrastive_loss": 1.3561255931854248, - "train/negative_loss": 1.3560829162597656, - "train/num_negatives": 48, + "train/classification_loss": 0.2516249418258667, + "train/contrastive_loss": 1.2834277153015137, + "train/negative_loss": 0.7897829413414001, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 4.261874710209668e-05, - "train/total_loss": 0.4265555739402771 + "train/positive_loss": 0.4936448037624359, + "train/total_loss": 0.5083104968070984 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.18187275528907776, - "train/contrastive_loss": 0.20535169541835785, - "train/negative_loss": 0.19765962660312653, + "train/classification_loss": 0.2277771234512329, + "train/contrastive_loss": 0.9544593095779419, + "train/negative_loss": 0.6912152171134949, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.007692062295973301, - "train/total_loss": 0.22294309735298157 + "train/num_positives": 14, + "train/positive_loss": 0.263244092464447, + "train/total_loss": 0.4186689853668213 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.16364902257919312, - "train/contrastive_loss": 1.0235378742218018, - "train/negative_loss": 0.9670833945274353, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.056454528123140335, - "train/total_loss": 0.3683565855026245 + "train/classification_loss": 0.3175206780433655, + "train/contrastive_loss": 2.5090723037719727, + "train/negative_loss": 1.6274548768997192, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 0.881617546081543, + "train/total_loss": 0.8193351626396179 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.236740842461586, - "train/contrastive_loss": 0.5696328282356262, - "train/negative_loss": 0.49136078357696533, - "train/num_negatives": 28, + "train/classification_loss": 0.16671912372112274, + "train/contrastive_loss": 0.7467590570449829, + "train/negative_loss": 0.6714926958084106, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.07827206701040268, - "train/total_loss": 0.35066741704940796 + "train/positive_loss": 0.07526636123657227, + "train/total_loss": 0.31607094407081604 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.2073569893836975, - "train/contrastive_loss": 2.391928195953369, - "train/negative_loss": 1.5783053636550903, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.8136228919029236, - "train/total_loss": 0.6857426166534424 + "train/classification_loss": 0.1625654250383377, + "train/contrastive_loss": 0.42692652344703674, + "train/negative_loss": 0.272882342338562, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.15404418110847473, + "train/total_loss": 0.2479507327079773 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.1831737756729126, - "train/contrastive_loss": 0.43343278765678406, - "train/negative_loss": 0.43237021565437317, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.0010625696741044521, - "train/total_loss": 0.26986032724380493 + "train/classification_loss": 0.1999031901359558, + "train/contrastive_loss": 0.9797678589820862, + "train/negative_loss": 0.9129236340522766, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.06684423238039017, + "train/total_loss": 0.3958567678928375 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.23084725439548492, - "train/contrastive_loss": 2.140575885772705, - "train/negative_loss": 1.1399478912353516, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.0006279945373535, - "train/total_loss": 0.6589624285697937 + "train/classification_loss": 0.23402690887451172, + "train/contrastive_loss": 3.5618300437927246, + "train/negative_loss": 1.1926548480987549, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 2.3691751956939697, + "train/total_loss": 0.9463929533958435 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.23744191229343414, - "train/contrastive_loss": 2.729140520095825, - "train/negative_loss": 1.8760254383087158, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.8531150817871094, - "train/total_loss": 0.783270001411438 + "train/classification_loss": 0.2535379230976105, + "train/contrastive_loss": 2.0842363834381104, + "train/negative_loss": 1.8566031455993652, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.2276332825422287, + "train/total_loss": 0.6703852415084839 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.1935051679611206, - "train/contrastive_loss": 0.9538302421569824, - "train/negative_loss": 0.7102068066596985, + "train/classification_loss": 0.17132024466991425, + "train/contrastive_loss": 0.400510311126709, + "train/negative_loss": 0.3717068135738373, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.24362345039844513, - "train/total_loss": 0.38427120447158813 + "train/num_positives": 16, + "train/positive_loss": 0.02880351059138775, + "train/total_loss": 0.25142231583595276 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.1853124052286148, - "train/contrastive_loss": 2.819542646408081, - "train/negative_loss": 1.9992727041244507, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.8202700018882751, - "train/total_loss": 0.7492209076881409 + "train/classification_loss": 0.2238728255033493, + "train/contrastive_loss": 2.9969887733459473, + "train/negative_loss": 1.5601463317871094, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 1.4368423223495483, + "train/total_loss": 0.8232706189155579 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.2525351047515869, - "train/contrastive_loss": 2.347477912902832, - "train/negative_loss": 1.66643488407135, + "train/classification_loss": 0.28535664081573486, + "train/contrastive_loss": 2.485658884048462, + "train/negative_loss": 2.0277631282806396, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.6810430884361267, - "train/total_loss": 0.7220306992530823 + "train/num_positives": 2, + "train/positive_loss": 0.45789575576782227, + "train/total_loss": 0.7824884653091431 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.22538906335830688, - "train/contrastive_loss": 2.286180019378662, - "train/negative_loss": 1.8927674293518066, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.393412709236145, - "train/total_loss": 0.6826250553131104 + "train/classification_loss": 0.17268261313438416, + "train/contrastive_loss": 1.8713536262512207, + "train/negative_loss": 1.5168644189834595, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.354489266872406, + "train/total_loss": 0.5469533205032349 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.19315147399902344, - "train/contrastive_loss": 2.488694190979004, - "train/negative_loss": 1.8446251153945923, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.6440689563751221, - "train/total_loss": 0.6908903121948242 + "train/classification_loss": 0.21092760562896729, + "train/contrastive_loss": 0.8458287715911865, + "train/negative_loss": 0.7711238861083984, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.07470490038394928, + "train/total_loss": 0.38009336590766907 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.21234636008739471, - "train/contrastive_loss": 2.136584758758545, - "train/negative_loss": 1.6146305799484253, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.5219542980194092, - "train/total_loss": 0.6396633386611938 + "train/classification_loss": 0.22525931894779205, + "train/contrastive_loss": 1.6337599754333496, + "train/negative_loss": 0.45575714111328125, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 1.1780028343200684, + "train/total_loss": 0.5520113110542297 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.2336258590221405, - "train/contrastive_loss": 3.907989978790283, - "train/negative_loss": 3.353170394897461, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.5548194646835327, - "train/total_loss": 1.0152238607406616 + "train/classification_loss": 0.21781055629253387, + "train/contrastive_loss": 4.552392959594727, + "train/negative_loss": 4.552349090576172, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 4.367647852632217e-05, + "train/total_loss": 1.1282891035079956 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.2501906752586365, - "train/contrastive_loss": 2.890026092529297, - "train/negative_loss": 2.264984130859375, + "train/classification_loss": 0.21694669127464294, + "train/contrastive_loss": 0.8992151021957397, + "train/negative_loss": 0.6574814319610596, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.6250419616699219, - "train/total_loss": 0.8281959295272827 + "train/positive_loss": 0.24173367023468018, + "train/total_loss": 0.3967897295951843 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.2152279019355774, - "train/contrastive_loss": 0.8655999898910522, - "train/negative_loss": 0.8651418685913086, + "train/classification_loss": 0.23654568195343018, + "train/contrastive_loss": 1.8724230527877808, + "train/negative_loss": 1.4034903049468994, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.0004581510729622096, - "train/total_loss": 0.38834792375564575 + "train/num_positives": 8, + "train/positive_loss": 0.46893274784088135, + "train/total_loss": 0.6110303401947021 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.17792780697345734, - "train/contrastive_loss": 0.814980149269104, - "train/negative_loss": 0.5685877799987793, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.2463923543691635, - "train/total_loss": 0.34092384576797485 + "train/classification_loss": 0.18248401582241058, + "train/contrastive_loss": 2.415851593017578, + "train/negative_loss": 1.0401480197906494, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.3757035732269287, + "train/total_loss": 0.6656543612480164 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.2212192714214325, - "train/contrastive_loss": 2.074857711791992, - "train/negative_loss": 1.0159920454025269, - "train/num_negatives": 46, + "train/classification_loss": 0.2719835340976715, + "train/contrastive_loss": 2.2993414402008057, + "train/negative_loss": 2.076965093612671, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 1.0588657855987549, - "train/total_loss": 0.6361908316612244 + "train/positive_loss": 0.22237637639045715, + "train/total_loss": 0.7318518161773682 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.27000370621681213, - "train/contrastive_loss": 1.68716299533844, - "train/negative_loss": 1.68716299533844, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.6074362993240356 - }, - { - "epoch": 4.942965779467681, - "eval_exact_match_accuracy": 0.18857142857142858, - "eval_hamming_loss": 0.07697478991596639, - "eval_loss": 0.5944982767105103, - "eval_macro_f1": 0.10527338457746319, - "eval_macro_precision": 0.14948110318296118, - "eval_macro_recall": 0.08512900735938898, - "eval_micro_f1": 0.4062229904926534, - "eval_micro_precision": 0.8453237410071942, - "eval_micro_recall": 0.267349260523322, - "eval_runtime": 2.6312, - "eval_samples_per_second": 199.531, - "eval_steps_per_second": 25.084, + "train/classification_loss": 0.2427232563495636, + "train/contrastive_loss": 2.012882947921753, + "train/negative_loss": 1.3373515605926514, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.6755313873291016, + "train/total_loss": 0.6452998518943787 + }, + { + "epoch": 4.577464788732394, + "eval_exact_match_accuracy": 0.20105820105820105, + "eval_hamming_loss": 0.07563025210084033, + "eval_loss": 0.6144142746925354, + "eval_macro_f1": 0.16896361025951567, + "eval_macro_precision": 0.2716061903688679, + "eval_macro_recall": 0.128501009843108, + "eval_micro_f1": 0.4, + "eval_micro_precision": 0.8772563176895307, + "eval_micro_recall": 0.25906183368869934, + "eval_runtime": 2.8436, + "eval_samples_per_second": 199.398, + "eval_steps_per_second": 24.969, "step": 1300 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.20715349912643433, - "train/contrastive_loss": 1.1526392698287964, - "train/negative_loss": 0.8156041502952576, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.3370351493358612, - "train/total_loss": 0.4376813769340515 + "train/classification_loss": 0.22063268721103668, + "train/contrastive_loss": 0.9216023087501526, + "train/negative_loss": 0.7635083198547363, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.15809400379657745, + "train/total_loss": 0.40495315194129944 }, { - "epoch": 4.942965779467681, + "epoch": 4.577464788732394, "step": 1300, - "train/classification_loss": 0.16839265823364258, - "train/contrastive_loss": 0.6921669840812683, - "train/negative_loss": 0.39601951837539673, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.2961474657058716, - "train/total_loss": 0.30682605504989624 + "train/classification_loss": 0.16536462306976318, + "train/contrastive_loss": 0.5875394940376282, + "train/negative_loss": 0.5407856702804565, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.04675380885601044, + "train/total_loss": 0.2828725278377533 }, { - "epoch": 5.133079847908745, - "grad_norm": 12.847837448120117, - "learning_rate": 1.981019786910198e-05, - "loss": 0.8865, + "epoch": 4.753521126760563, + "grad_norm": 14.944501876831055, + "learning_rate": 1.982438336856942e-05, + "loss": 0.9271, "step": 1350 }, { - "epoch": 5.133079847908745, + "epoch": 4.753521126760563, "step": 1350, - "train/classification_loss": 0.20381368696689606, - "train/contrastive_loss": 1.1846051216125488, - "train/negative_loss": 0.8206002116203308, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.36400488018989563, - "train/total_loss": 0.44073471426963806 + "train/classification_loss": 0.21598052978515625, + "train/contrastive_loss": 1.0731817483901978, + "train/negative_loss": 1.0209242105484009, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.052257586270570755, + "train/total_loss": 0.4306168854236603 }, { - "epoch": 5.133079847908745, + "epoch": 4.753521126760563, "step": 1350, - "train/classification_loss": 0.12618252635002136, - "train/contrastive_loss": 1.006263256072998, - "train/negative_loss": 0.9571497440338135, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.04911347106099129, - "train/total_loss": 0.3274351954460144 + "train/classification_loss": 0.23102152347564697, + "train/contrastive_loss": 1.7591127157211304, + "train/negative_loss": 1.6203545331954956, + "train/num_negatives": 28, + "train/num_positives": 20, + "train/positive_loss": 0.13875816762447357, + "train/total_loss": 0.582844078540802 }, { - "epoch": 5.32319391634981, - "grad_norm": 13.726969718933105, - "learning_rate": 1.9802587519025876e-05, - "loss": 0.867, + "epoch": 4.929577464788732, + "grad_norm": 12.897309303283691, + "learning_rate": 1.9817336152219873e-05, + "loss": 0.9275, "step": 1400 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.2615830600261688, - "train/contrastive_loss": 2.02305006980896, - "train/negative_loss": 0.8841612935066223, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.1388887166976929, - "train/total_loss": 0.6661930680274963 + "train/classification_loss": 0.23393715918064117, + "train/contrastive_loss": 1.4722117185592651, + "train/negative_loss": 1.2722023725509644, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.2000093311071396, + "train/total_loss": 0.528379499912262 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.24789822101593018, - "train/contrastive_loss": 1.8829174041748047, - "train/negative_loss": 1.1688361167907715, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.7140812277793884, - "train/total_loss": 0.6244816780090332 + "train/classification_loss": 0.2999577224254608, + "train/contrastive_loss": 1.2361167669296265, + "train/negative_loss": 0.8706927299499512, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.3654240369796753, + "train/total_loss": 0.5471810698509216 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.1863137036561966, - "train/contrastive_loss": 2.202282428741455, - "train/negative_loss": 0.8011972904205322, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.4010850191116333, - "train/total_loss": 0.6267701983451843 + "train/classification_loss": 0.25975456833839417, + "train/contrastive_loss": 2.3680732250213623, + "train/negative_loss": 1.2489418983459473, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.119131326675415, + "train/total_loss": 0.7333692312240601 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.19273261725902557, - "train/contrastive_loss": 2.963813304901123, - "train/negative_loss": 2.417818546295166, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.5459948182106018, - "train/total_loss": 0.7854952812194824 + "train/classification_loss": 0.15801315009593964, + "train/contrastive_loss": 0.7145366072654724, + "train/negative_loss": 0.6202155351638794, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.09432106465101242, + "train/total_loss": 0.3009204864501953 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.18653996288776398, - "train/contrastive_loss": 2.7597742080688477, - "train/negative_loss": 2.387730836868286, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.372043251991272, - "train/total_loss": 0.7384948134422302 + "train/classification_loss": 0.21140454709529877, + "train/contrastive_loss": 2.6877408027648926, + "train/negative_loss": 2.503927230834961, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.18381357192993164, + "train/total_loss": 0.7489527463912964 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.20117434859275818, - "train/contrastive_loss": 1.7952840328216553, - "train/negative_loss": 1.2378432750701904, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.5574406981468201, - "train/total_loss": 0.5602311491966248 + "train/classification_loss": 0.22213847935199738, + "train/contrastive_loss": 2.550034999847412, + "train/negative_loss": 1.4603843688964844, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 1.0896506309509277, + "train/total_loss": 0.7321454882621765 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.2553505003452301, - "train/contrastive_loss": 1.1892261505126953, - "train/negative_loss": 0.959560215473175, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.22966596484184265, - "train/total_loss": 0.49319571256637573 + "train/classification_loss": 0.20857639610767365, + "train/contrastive_loss": 2.272698402404785, + "train/negative_loss": 1.4846333265304565, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.7880651354789734, + "train/total_loss": 0.6631160974502563 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.17589586973190308, - "train/contrastive_loss": 1.11697256565094, - "train/negative_loss": 1.0259848833084106, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.09098769724369049, - "train/total_loss": 0.39929038286209106 + "train/classification_loss": 0.22684897482395172, + "train/contrastive_loss": 0.9840952754020691, + "train/negative_loss": 0.9840511679649353, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 4.4108408474130556e-05, + "train/total_loss": 0.4236680269241333 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.1703890711069107, - "train/contrastive_loss": 1.8117637634277344, - "train/negative_loss": 1.4861793518066406, + "train/classification_loss": 0.1542213410139084, + "train/contrastive_loss": 0.6024507284164429, + "train/negative_loss": 0.543899655342102, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.32558444142341614, - "train/total_loss": 0.5327418446540833 + "train/positive_loss": 0.058551084250211716, + "train/total_loss": 0.2747114896774292 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.3062739968299866, - "train/contrastive_loss": 3.403672933578491, - "train/negative_loss": 1.849557638168335, + "train/classification_loss": 0.2476825714111328, + "train/contrastive_loss": 3.0360355377197266, + "train/negative_loss": 1.9377377033233643, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.5541152954101562, - "train/total_loss": 0.9870085716247559 + "train/num_positives": 14, + "train/positive_loss": 1.0982978343963623, + "train/total_loss": 0.8548896908760071 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.20118823647499084, - "train/contrastive_loss": 1.1976510286331177, - "train/negative_loss": 0.9414138197898865, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.2562371790409088, - "train/total_loss": 0.4407184422016144 + "train/classification_loss": 0.1866694837808609, + "train/contrastive_loss": 1.3327810764312744, + "train/negative_loss": 0.9623618125915527, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.3704192340373993, + "train/total_loss": 0.4532257318496704 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.15554864704608917, - "train/contrastive_loss": 1.0694890022277832, - "train/negative_loss": 0.7510858178138733, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.3184032440185547, - "train/total_loss": 0.36944645643234253 + "train/classification_loss": 0.21355567872524261, + "train/contrastive_loss": 1.8908418416976929, + "train/negative_loss": 1.8872884511947632, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.003553333692252636, + "train/total_loss": 0.5917240381240845 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.24908247590065002, - "train/contrastive_loss": 3.0534048080444336, - "train/negative_loss": 2.5366592407226562, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.5167456865310669, - "train/total_loss": 0.859763503074646 + "train/classification_loss": 0.24093280732631683, + "train/contrastive_loss": 3.631753921508789, + "train/negative_loss": 2.140901565551758, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.4908523559570312, + "train/total_loss": 0.9672836065292358 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.16630233824253082, - "train/contrastive_loss": 2.007511615753174, - "train/negative_loss": 1.998839020729065, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.008672541007399559, - "train/total_loss": 0.5678046941757202 + "train/classification_loss": 0.23973363637924194, + "train/contrastive_loss": 1.4302055835723877, + "train/negative_loss": 1.3044441938400269, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.12576135993003845, + "train/total_loss": 0.5257747173309326 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.15795864164829254, - "train/contrastive_loss": 1.999880075454712, - "train/negative_loss": 1.363979458808899, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.6359006762504578, - "train/total_loss": 0.5579346418380737 + "train/classification_loss": 0.15119034051895142, + "train/contrastive_loss": 2.565791368484497, + "train/negative_loss": 0.7071977257728577, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.8585937023162842, + "train/total_loss": 0.6643486022949219 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.16668033599853516, - "train/contrastive_loss": 0.5617552399635315, - "train/negative_loss": 0.5555193424224854, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.006235912907868624, - "train/total_loss": 0.2790313959121704 + "train/classification_loss": 0.20661590993404388, + "train/contrastive_loss": 1.4633798599243164, + "train/negative_loss": 0.785781979560852, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.6775978803634644, + "train/total_loss": 0.49929189682006836 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.240486741065979, - "train/contrastive_loss": 2.1037795543670654, - "train/negative_loss": 1.6308869123458862, - "train/num_negatives": 40, + "train/classification_loss": 0.17302308976650238, + "train/contrastive_loss": 1.5027965307235718, + "train/negative_loss": 1.095802903175354, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.472892701625824, - "train/total_loss": 0.661242663860321 + "train/positive_loss": 0.4069935977458954, + "train/total_loss": 0.47358238697052 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.220224991440773, - "train/contrastive_loss": 1.3090722560882568, - "train/negative_loss": 0.21553462743759155, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 1.09353768825531, - "train/total_loss": 0.4820394515991211 + "train/classification_loss": 0.20444808900356293, + "train/contrastive_loss": 1.4097462892532349, + "train/negative_loss": 1.1200119256973267, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.2897343337535858, + "train/total_loss": 0.48639732599258423 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.23242653906345367, - "train/contrastive_loss": 1.8405430316925049, - "train/negative_loss": 1.839255690574646, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.0012873370433226228, - "train/total_loss": 0.6005351543426514 + "train/classification_loss": 0.22217759490013123, + "train/contrastive_loss": 1.3416063785552979, + "train/negative_loss": 1.2977246046066284, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.04388182982802391, + "train/total_loss": 0.4904988706111908 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.18661300837993622, - "train/contrastive_loss": 3.133199453353882, - "train/negative_loss": 0.9118657112121582, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 2.2213337421417236, - "train/total_loss": 0.8132529258728027 + "train/classification_loss": 0.19605687260627747, + "train/contrastive_loss": 3.1035685539245605, + "train/negative_loss": 1.8977183103561401, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.20585036277771, + "train/total_loss": 0.8167705535888672 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.26445871591567993, - "train/contrastive_loss": 2.6412243843078613, - "train/negative_loss": 1.186860203742981, - "train/num_negatives": 44, + "train/classification_loss": 0.17438937723636627, + "train/contrastive_loss": 1.1631836891174316, + "train/negative_loss": 1.144606351852417, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.4543641805648804, - "train/total_loss": 0.7927036285400391 + "train/positive_loss": 0.018577340990304947, + "train/total_loss": 0.40702611207962036 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.2701681852340698, - "train/contrastive_loss": 1.7600022554397583, - "train/negative_loss": 1.5431441068649292, - "train/num_negatives": 44, + "train/classification_loss": 0.14891044795513153, + "train/contrastive_loss": 1.7904173135757446, + "train/negative_loss": 1.5921657085418701, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.21685810387134552, - "train/total_loss": 0.6221686601638794 + "train/positive_loss": 0.1982516199350357, + "train/total_loss": 0.5069938898086548 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.14993156492710114, - "train/contrastive_loss": 0.623949408531189, - "train/negative_loss": 0.21898964047431946, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.4049597382545471, - "train/total_loss": 0.2747214436531067 + "train/classification_loss": 0.2139759659767151, + "train/contrastive_loss": 3.727570056915283, + "train/negative_loss": 1.7804551124572754, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 1.9471148252487183, + "train/total_loss": 0.9594900012016296 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.15490852296352386, - "train/contrastive_loss": 0.31422314047813416, - "train/negative_loss": 0.254720002412796, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.059503134340047836, - "train/total_loss": 0.21775314211845398 + "train/classification_loss": 0.2626914083957672, + "train/contrastive_loss": 2.6890525817871094, + "train/negative_loss": 1.2976715564727783, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.391381025314331, + "train/total_loss": 0.8005019426345825 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.13691763579845428, - "train/contrastive_loss": 1.0543084144592285, - "train/negative_loss": 0.886838436126709, + "train/classification_loss": 0.19910500943660736, + "train/contrastive_loss": 1.7909460067749023, + "train/negative_loss": 0.870284914970398, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.1674700230360031, - "train/total_loss": 0.3477793335914612 + "train/num_positives": 10, + "train/positive_loss": 0.9206610918045044, + "train/total_loss": 0.5572941899299622 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.26271912455558777, - "train/contrastive_loss": 0.8706082105636597, - "train/negative_loss": 0.4358740746974945, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 0.43473416566848755, - "train/total_loss": 0.4368407726287842 + "train/classification_loss": 0.2213013619184494, + "train/contrastive_loss": 3.4536094665527344, + "train/negative_loss": 2.116147041320801, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.3374624252319336, + "train/total_loss": 0.9120233058929443 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.2564815580844879, - "train/contrastive_loss": 2.3176651000976562, - "train/negative_loss": 1.6614866256713867, + "train/classification_loss": 0.23854103684425354, + "train/contrastive_loss": 1.6801559925079346, + "train/negative_loss": 1.675628423690796, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.6561784148216248, - "train/total_loss": 0.7200145721435547 + "train/num_positives": 4, + "train/positive_loss": 0.004527554847300053, + "train/total_loss": 0.5745722055435181 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.21024855971336365, - "train/contrastive_loss": 2.5089821815490723, - "train/negative_loss": 1.9837161302566528, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.5252659320831299, - "train/total_loss": 0.7120449542999268 + "train/classification_loss": 0.21013152599334717, + "train/contrastive_loss": 0.3212376534938812, + "train/negative_loss": 0.3000991940498352, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.021138465031981468, + "train/total_loss": 0.27437907457351685 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.20810312032699585, - "train/contrastive_loss": 0.8019324541091919, - "train/negative_loss": 0.5802662372589111, - "train/num_negatives": 40, + "train/classification_loss": 0.2551615238189697, + "train/contrastive_loss": 2.024010181427002, + "train/negative_loss": 0.9517756104469299, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.22166620194911957, - "train/total_loss": 0.3684896230697632 + "train/positive_loss": 1.0722346305847168, + "train/total_loss": 0.6599636077880859 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.23325859010219574, - "train/contrastive_loss": 2.2339203357696533, - "train/negative_loss": 1.2669094800949097, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.9670108556747437, - "train/total_loss": 0.6800426840782166 + "train/classification_loss": 0.24212419986724854, + "train/contrastive_loss": 0.7657091021537781, + "train/negative_loss": 0.7523344159126282, + "train/num_negatives": 38, + "train/num_positives": 10, + "train/positive_loss": 0.013374675996601582, + "train/total_loss": 0.39526602625846863 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.18063890933990479, - "train/contrastive_loss": 1.994586706161499, - "train/negative_loss": 0.8382356762886047, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 1.156351089477539, - "train/total_loss": 0.5795562267303467 + "train/classification_loss": 0.1769164353609085, + "train/contrastive_loss": 1.89718496799469, + "train/negative_loss": 1.8965978622436523, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.0005871434696018696, + "train/total_loss": 0.5563534498214722 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.24477431178092957, - "train/contrastive_loss": 2.870698928833008, - "train/negative_loss": 1.6100449562072754, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.260654091835022, - "train/total_loss": 0.8189140558242798 + "train/classification_loss": 0.20006434619426727, + "train/contrastive_loss": 3.621943712234497, + "train/negative_loss": 2.390413999557495, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.231529712677002, + "train/total_loss": 0.9244531393051147 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.25434163212776184, - "train/contrastive_loss": 0.8172174692153931, - "train/negative_loss": 0.8143876194953918, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0028298564720898867, - "train/total_loss": 0.417785108089447 + "train/classification_loss": 0.21074402332305908, + "train/contrastive_loss": 2.6736202239990234, + "train/negative_loss": 1.5347355604171753, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.1388845443725586, + "train/total_loss": 0.7454680800437927 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.2281278520822525, - "train/contrastive_loss": 2.6342861652374268, - "train/negative_loss": 1.2270288467407227, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 1.407257318496704, - "train/total_loss": 0.7549850940704346 + "train/classification_loss": 0.23172606527805328, + "train/contrastive_loss": 1.8997231721878052, + "train/negative_loss": 1.5308058261871338, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.368917316198349, + "train/total_loss": 0.611670732498169 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.21400688588619232, - "train/contrastive_loss": 3.911576271057129, - "train/negative_loss": 1.9929203987121582, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.9186559915542603, - "train/total_loss": 0.9963221549987793 + "train/classification_loss": 0.24845577776432037, + "train/contrastive_loss": 1.744419813156128, + "train/negative_loss": 1.3105539083480835, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.43386590480804443, + "train/total_loss": 0.5973397493362427 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.18613727390766144, - "train/contrastive_loss": 2.453258991241455, - "train/negative_loss": 1.2741819620132446, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.1790771484375, - "train/total_loss": 0.6767891049385071 + "train/classification_loss": 0.16125430166721344, + "train/contrastive_loss": 2.1428160667419434, + "train/negative_loss": 1.9983477592468262, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.14446841180324554, + "train/total_loss": 0.5898175239562988 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.17933331429958344, - "train/contrastive_loss": 1.0905709266662598, - "train/negative_loss": 0.9223586916923523, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.1682121902704239, - "train/total_loss": 0.39744749665260315 + "train/classification_loss": 0.23195935785770416, + "train/contrastive_loss": 1.6570932865142822, + "train/negative_loss": 1.1011319160461426, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 0.5559613108634949, + "train/total_loss": 0.5633780360221863 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.2027289718389511, - "train/contrastive_loss": 1.3253800868988037, - "train/negative_loss": 1.1005429029464722, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.22483713924884796, - "train/total_loss": 0.4678049683570862 + "train/classification_loss": 0.26865336298942566, + "train/contrastive_loss": 3.343217611312866, + "train/negative_loss": 2.9467906951904297, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.3964269161224365, + "train/total_loss": 0.9372968673706055 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.23409044742584229, - "train/contrastive_loss": 2.1552093029022217, - "train/negative_loss": 2.1076836585998535, - "train/num_negatives": 46, + "train/classification_loss": 0.21648384630680084, + "train/contrastive_loss": 1.1829619407653809, + "train/negative_loss": 0.5028421878814697, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.6801196932792664, + "train/total_loss": 0.45307624340057373 + }, + { + "epoch": 4.929577464788732, + "step": 1400, + "train/classification_loss": 0.28715255856513977, + "train/contrastive_loss": 3.8815360069274902, + "train/negative_loss": 1.99509596824646, + "train/num_negatives": 42, "train/num_positives": 8, - "train/positive_loss": 0.047525666654109955, - "train/total_loss": 0.6651322841644287 + "train/positive_loss": 1.8864400386810303, + "train/total_loss": 1.0634597539901733 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.20971526205539703, - "train/contrastive_loss": 1.5825802087783813, - "train/negative_loss": 1.5595290660858154, + "train/classification_loss": 0.15984392166137695, + "train/contrastive_loss": 1.2444604635238647, + "train/negative_loss": 0.7440666556358337, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.02305115945637226, - "train/total_loss": 0.5262312889099121 + "train/num_positives": 10, + "train/positive_loss": 0.500393807888031, + "train/total_loss": 0.4087360203266144 + }, + { + "epoch": 4.929577464788732, + "step": 1400, + "train/classification_loss": 0.1855562925338745, + "train/contrastive_loss": 1.7380281686782837, + "train/negative_loss": 1.3140361309051514, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.42399200797080994, + "train/total_loss": 0.5331619381904602 + }, + { + "epoch": 4.929577464788732, + "step": 1400, + "train/classification_loss": 0.22104769945144653, + "train/contrastive_loss": 1.1489006280899048, + "train/negative_loss": 1.1484401226043701, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.0004604670684784651, + "train/total_loss": 0.45082783699035645 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.18506687879562378, - "train/contrastive_loss": 0.661515474319458, - "train/negative_loss": 0.6595361828804016, + "train/classification_loss": 0.2730380594730377, + "train/contrastive_loss": 1.5600128173828125, + "train/negative_loss": 1.4715052843093872, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.001979269552975893, - "train/total_loss": 0.3173699975013733 + "train/positive_loss": 0.08850748836994171, + "train/total_loss": 0.5850406289100647 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.19836899638175964, - "train/contrastive_loss": 1.2748968601226807, - "train/negative_loss": 1.2401374578475952, - "train/num_negatives": 36, + "train/classification_loss": 0.2212018519639969, + "train/contrastive_loss": 1.9971472024917603, + "train/negative_loss": 1.3740453720092773, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.6231018304824829, + "train/total_loss": 0.6206312775611877 + }, + { + "epoch": 4.929577464788732, + "step": 1400, + "train/classification_loss": 0.2970312535762787, + "train/contrastive_loss": 2.325863838195801, + "train/negative_loss": 1.122704267501831, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.03475942090153694, - "train/total_loss": 0.4533483684062958 + "train/positive_loss": 1.2031596899032593, + "train/total_loss": 0.7622040510177612 + }, + { + "epoch": 4.929577464788732, + "step": 1400, + "train/classification_loss": 0.19004490971565247, + "train/contrastive_loss": 3.3516011238098145, + "train/negative_loss": 1.4583089351654053, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.8932920694351196, + "train/total_loss": 0.8603651523590088 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.23820456862449646, - "train/contrastive_loss": 1.138126015663147, - "train/negative_loss": 0.5975877046585083, + "train/classification_loss": 0.22262173891067505, + "train/contrastive_loss": 2.6947569847106934, + "train/negative_loss": 2.2964460849761963, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.5405383110046387, - "train/total_loss": 0.4658297896385193 + "train/num_positives": 14, + "train/positive_loss": 0.39831095933914185, + "train/total_loss": 0.7615731358528137 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.20265349745750427, - "train/contrastive_loss": 2.652071475982666, - "train/negative_loss": 1.2271381616592407, + "train/classification_loss": 0.2667829394340515, + "train/contrastive_loss": 2.5166549682617188, + "train/negative_loss": 2.516644239425659, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.4249331951141357, - "train/total_loss": 0.7330677509307861 + "train/num_positives": 2, + "train/positive_loss": 1.0728893357736524e-05, + "train/total_loss": 0.7701139450073242 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.16533184051513672, - "train/contrastive_loss": 1.4138803482055664, - "train/negative_loss": 0.8274204134941101, + "train/classification_loss": 0.20589295029640198, + "train/contrastive_loss": 1.7858270406723022, + "train/negative_loss": 1.328407883644104, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.5864599347114563, - "train/total_loss": 0.44810792803764343 + "train/num_positives": 16, + "train/positive_loss": 0.45741915702819824, + "train/total_loss": 0.5630583763122559 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.3001149594783783, - "train/contrastive_loss": 1.5137439966201782, - "train/negative_loss": 1.4765738248825073, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.03717018663883209, - "train/total_loss": 0.6028637886047363 + "train/classification_loss": 0.19719679653644562, + "train/contrastive_loss": 0.6879628300666809, + "train/negative_loss": 0.6219642758369446, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.06599855422973633, + "train/total_loss": 0.33478936553001404 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.15420083701610565, - "train/contrastive_loss": 1.1335591077804565, - "train/negative_loss": 1.1332674026489258, - "train/num_negatives": 48, + "train/classification_loss": 0.23205526173114777, + "train/contrastive_loss": 0.7114622592926025, + "train/negative_loss": 0.5853481888771057, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 0.00029174581868574023, - "train/total_loss": 0.3809126615524292 + "train/positive_loss": 0.12611407041549683, + "train/total_loss": 0.3743477165699005 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.17593583464622498, - "train/contrastive_loss": 0.24660232663154602, - "train/negative_loss": 0.24215632677078247, + "train/classification_loss": 0.23155814409255981, + "train/contrastive_loss": 1.034451961517334, + "train/negative_loss": 0.8554577231407166, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.004445997532457113, - "train/total_loss": 0.2252562940120697 + "train/num_positives": 14, + "train/positive_loss": 0.17899425327777863, + "train/total_loss": 0.43844854831695557 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.16412989795207977, - "train/contrastive_loss": 1.1565595865249634, - "train/negative_loss": 0.9386652708053589, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.2178942710161209, - "train/total_loss": 0.39544183015823364 + "train/classification_loss": 0.3008689880371094, + "train/contrastive_loss": 1.319309115409851, + "train/negative_loss": 1.1135939359664917, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 0.205715149641037, + "train/total_loss": 0.5647308230400085 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.234500914812088, - "train/contrastive_loss": 1.990515112876892, - "train/negative_loss": 1.6671044826507568, - "train/num_negatives": 28, + "train/classification_loss": 0.16647109389305115, + "train/contrastive_loss": 0.9486055970191956, + "train/negative_loss": 0.8614486455917358, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.32341060042381287, - "train/total_loss": 0.6326039433479309 + "train/positive_loss": 0.08715693652629852, + "train/total_loss": 0.3561922311782837 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.20513677597045898, - "train/contrastive_loss": 2.0771307945251465, - "train/negative_loss": 0.9234853386878967, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.153645396232605, - "train/total_loss": 0.6205629110336304 + "train/classification_loss": 0.15506407618522644, + "train/contrastive_loss": 0.5729125142097473, + "train/negative_loss": 0.3452664017677307, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.2276460975408554, + "train/total_loss": 0.2696465849876404 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.18384720385074615, - "train/contrastive_loss": 0.41552749276161194, - "train/negative_loss": 0.41289621591567993, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.002631284762173891, - "train/total_loss": 0.2669526934623718 + "train/classification_loss": 0.19409959018230438, + "train/contrastive_loss": 0.7444077134132385, + "train/negative_loss": 0.7230579853057861, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.02134970761835575, + "train/total_loss": 0.34298112988471985 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.21186231076717377, - "train/contrastive_loss": 2.3514602184295654, - "train/negative_loss": 0.6709760427474976, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.6804841756820679, - "train/total_loss": 0.6821543574333191 + "train/classification_loss": 0.22766001522541046, + "train/contrastive_loss": 2.6191601753234863, + "train/negative_loss": 1.266123652458191, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.3530365228652954, + "train/total_loss": 0.7514920234680176 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.2338688224554062, - "train/contrastive_loss": 2.024965524673462, - "train/negative_loss": 0.9493040442466736, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.075661540031433, - "train/total_loss": 0.6388619542121887 + "train/classification_loss": 0.22966733574867249, + "train/contrastive_loss": 0.7468936443328857, + "train/negative_loss": 0.6868898272514343, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.060003843158483505, + "train/total_loss": 0.37904608249664307 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.1962486207485199, - "train/contrastive_loss": 1.9644200801849365, - "train/negative_loss": 0.7483246922492981, + "train/classification_loss": 0.16529713571071625, + "train/contrastive_loss": 0.5958980321884155, + "train/negative_loss": 0.37662050127983093, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 1.2160953283309937, - "train/total_loss": 0.5891326665878296 + "train/num_positives": 16, + "train/positive_loss": 0.2192775458097458, + "train/total_loss": 0.28447675704956055 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.18690218031406403, - "train/contrastive_loss": 3.0509345531463623, - "train/negative_loss": 1.690335988998413, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.3605985641479492, - "train/total_loss": 0.7970890998840332 + "train/classification_loss": 0.2148972749710083, + "train/contrastive_loss": 2.1638331413269043, + "train/negative_loss": 1.1603425741195679, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 1.003490686416626, + "train/total_loss": 0.647663950920105 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.24043448269367218, - "train/contrastive_loss": 2.7969751358032227, - "train/negative_loss": 1.4084162712097168, + "train/classification_loss": 0.27717262506484985, + "train/contrastive_loss": 1.8546534776687622, + "train/negative_loss": 1.818279504776001, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.3885587453842163, - "train/total_loss": 0.7998294830322266 + "train/num_positives": 2, + "train/positive_loss": 0.03637393191456795, + "train/total_loss": 0.6481033563613892 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.2247655838727951, - "train/contrastive_loss": 2.2181785106658936, - "train/negative_loss": 1.5634263753890991, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.6547521352767944, - "train/total_loss": 0.668401300907135 + "train/classification_loss": 0.1601891815662384, + "train/contrastive_loss": 2.100324869155884, + "train/negative_loss": 1.5401709079742432, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.5601539611816406, + "train/total_loss": 0.5802541971206665 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.19849370419979095, - "train/contrastive_loss": 2.6212351322174072, - "train/negative_loss": 1.7411000728607178, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.8801351189613342, - "train/total_loss": 0.7227407693862915 + "train/classification_loss": 0.2267373651266098, + "train/contrastive_loss": 2.0910134315490723, + "train/negative_loss": 1.3800240755081177, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.7109894752502441, + "train/total_loss": 0.6449400782585144 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.22658240795135498, - "train/contrastive_loss": 2.8916215896606445, - "train/negative_loss": 1.743910789489746, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.1477106809616089, - "train/total_loss": 0.8049067258834839 + "train/classification_loss": 0.22092710435390472, + "train/contrastive_loss": 1.2995631694793701, + "train/negative_loss": 0.5123441815376282, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 0.7872190475463867, + "train/total_loss": 0.48083972930908203 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.22981946170330048, - "train/contrastive_loss": 5.05959415435791, - "train/negative_loss": 3.808274269104004, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.2513201236724854, - "train/total_loss": 1.2417383193969727 + "train/classification_loss": 0.21065887808799744, + "train/contrastive_loss": 5.21412992477417, + "train/negative_loss": 5.214123725891113, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 6.163147190818563e-06, + "train/total_loss": 1.2534849643707275 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.2556140124797821, - "train/contrastive_loss": 2.9514644145965576, - "train/negative_loss": 1.919101595878601, + "train/classification_loss": 0.209507018327713, + "train/contrastive_loss": 1.1888965368270874, + "train/negative_loss": 0.6046951413154602, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.0323628187179565, - "train/total_loss": 0.8459068536758423 + "train/positive_loss": 0.5842013955116272, + "train/total_loss": 0.44728630781173706 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.2114701122045517, - "train/contrastive_loss": 0.9767836928367615, - "train/negative_loss": 0.9464170336723328, + "train/classification_loss": 0.24194557964801788, + "train/contrastive_loss": 2.0317795276641846, + "train/negative_loss": 1.567382574081421, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.030366651713848114, - "train/total_loss": 0.40682685375213623 + "train/num_positives": 8, + "train/positive_loss": 0.4643968939781189, + "train/total_loss": 0.6483014822006226 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.17964428663253784, - "train/contrastive_loss": 1.517561912536621, - "train/negative_loss": 0.6343120336532593, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.883249819278717, - "train/total_loss": 0.483156681060791 + "train/classification_loss": 0.1839798092842102, + "train/contrastive_loss": 3.1929068565368652, + "train/negative_loss": 1.279168725013733, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.9137382507324219, + "train/total_loss": 0.8225612044334412 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.198362797498703, - "train/contrastive_loss": 1.1947895288467407, - "train/negative_loss": 0.7933563590049744, - "train/num_negatives": 46, + "train/classification_loss": 0.2763615846633911, + "train/contrastive_loss": 2.311007499694824, + "train/negative_loss": 2.2773032188415527, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.40143319964408875, - "train/total_loss": 0.4373207092285156 + "train/positive_loss": 0.033704303205013275, + "train/total_loss": 0.738563060760498 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.2631293833255768, - "train/contrastive_loss": 1.4999243021011353, - "train/negative_loss": 1.4999243021011353, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5631142854690552 - }, - { - "epoch": 5.32319391634981, - "eval_exact_match_accuracy": 0.2019047619047619, - "eval_hamming_loss": 0.07607843137254902, - "eval_loss": 0.587147057056427, - "eval_macro_f1": 0.12020123059794742, - "eval_macro_precision": 0.26615714386112865, - "eval_macro_recall": 0.09501405155684811, - "eval_micro_f1": 0.4221276595744681, - "eval_micro_precision": 0.8378378378378378, - "eval_micro_recall": 0.2821387940841866, - "eval_runtime": 2.6351, - "eval_samples_per_second": 199.237, - "eval_steps_per_second": 25.047, + "train/classification_loss": 0.21757225692272186, + "train/contrastive_loss": 1.919898509979248, + "train/negative_loss": 1.5635740756988525, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.35632437467575073, + "train/total_loss": 0.6015519499778748 + }, + { + "epoch": 4.929577464788732, + "eval_exact_match_accuracy": 0.20634920634920634, + "eval_hamming_loss": 0.0742815644776429, + "eval_loss": 0.602698802947998, + "eval_macro_f1": 0.18039899366294992, + "eval_macro_precision": 0.26815441057420997, + "eval_macro_recall": 0.1408294182448942, + "eval_micro_f1": 0.42902711323763953, + "eval_micro_precision": 0.8512658227848101, + "eval_micro_recall": 0.2867803837953092, + "eval_runtime": 2.8408, + "eval_samples_per_second": 199.593, + "eval_steps_per_second": 24.993, "step": 1400 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.19161900877952576, - "train/contrastive_loss": 1.211616039276123, - "train/negative_loss": 1.1582905054092407, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.053325533866882324, - "train/total_loss": 0.43394219875335693 + "train/classification_loss": 0.22136974334716797, + "train/contrastive_loss": 1.2682056427001953, + "train/negative_loss": 1.1588491201400757, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.10935650765895844, + "train/total_loss": 0.47501087188720703 }, { - "epoch": 5.32319391634981, + "epoch": 4.929577464788732, "step": 1400, - "train/classification_loss": 0.22547754645347595, - "train/contrastive_loss": 0.7988379597663879, - "train/negative_loss": 0.6050838828086853, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.19375407695770264, - "train/total_loss": 0.385245144367218 + "train/classification_loss": 0.19550098478794098, + "train/contrastive_loss": 1.2021019458770752, + "train/negative_loss": 1.0115691423416138, + "train/num_negatives": 46, + "train/num_positives": 10, + "train/positive_loss": 0.19053274393081665, + "train/total_loss": 0.4359213709831238 }, { - "epoch": 5.513307984790875, - "grad_norm": 8.573578834533691, - "learning_rate": 1.9794977168949774e-05, - "loss": 0.8903, + "epoch": 5.105633802816901, + "grad_norm": 15.724308013916016, + "learning_rate": 1.981028893587033e-05, + "loss": 0.8954, "step": 1450 }, { - "epoch": 5.513307984790875, + "epoch": 5.105633802816901, "step": 1450, - "train/classification_loss": 0.21811936795711517, - "train/contrastive_loss": 1.0516337156295776, - "train/negative_loss": 0.7482859492301941, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.30334779620170593, - "train/total_loss": 0.42844611406326294 + "train/classification_loss": 0.18994148075580597, + "train/contrastive_loss": 1.1352885961532593, + "train/negative_loss": 0.6845282912254333, + "train/num_negatives": 32, + "train/num_positives": 24, + "train/positive_loss": 0.4507603347301483, + "train/total_loss": 0.4169992208480835 }, { - "epoch": 5.513307984790875, + "epoch": 5.105633802816901, "step": 1450, - "train/classification_loss": 0.20088213682174683, - "train/contrastive_loss": 2.2192068099975586, - "train/negative_loss": 1.2442798614501953, - "train/num_negatives": 52, + "train/classification_loss": 0.22752925753593445, + "train/contrastive_loss": 0.7950844764709473, + "train/negative_loss": 0.7596084475517273, + "train/num_negatives": 50, "train/num_positives": 4, - "train/positive_loss": 0.9749270081520081, - "train/total_loss": 0.6447235345840454 + "train/positive_loss": 0.03547599911689758, + "train/total_loss": 0.38654613494873047 }, { - "epoch": 5.7034220532319395, - "grad_norm": 16.019466400146484, - "learning_rate": 1.978736681887367e-05, - "loss": 0.9107, + "epoch": 5.28169014084507, + "grad_norm": 14.44680118560791, + "learning_rate": 1.9803241719520793e-05, + "loss": 0.8702, "step": 1500 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.27763721346855164, - "train/contrastive_loss": 2.2862582206726074, - "train/negative_loss": 1.8190003633499146, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.4672577381134033, - "train/total_loss": 0.7348888516426086 + "train/classification_loss": 0.22636128962039948, + "train/contrastive_loss": 2.0414843559265137, + "train/negative_loss": 1.6787714958190918, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.3627128601074219, + "train/total_loss": 0.63465815782547 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.24440829455852509, - "train/contrastive_loss": 2.197031021118164, - "train/negative_loss": 1.5310004949569702, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.6660306453704834, - "train/total_loss": 0.683814525604248 + "train/classification_loss": 0.2975652515888214, + "train/contrastive_loss": 0.7430849671363831, + "train/negative_loss": 0.6191623210906982, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.12392264604568481, + "train/total_loss": 0.4461822509765625 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.1811717450618744, - "train/contrastive_loss": 2.2234344482421875, - "train/negative_loss": 1.1282936334609985, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.0951409339904785, - "train/total_loss": 0.6258586645126343 + "train/classification_loss": 0.26759234070777893, + "train/contrastive_loss": 2.839524269104004, + "train/negative_loss": 1.739831566810608, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.0996925830841064, + "train/total_loss": 0.835497260093689 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.20157553255558014, - "train/contrastive_loss": 3.0962743759155273, - "train/negative_loss": 2.2215394973754883, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.8747347593307495, - "train/total_loss": 0.8208304047584534 + "train/classification_loss": 0.1427876055240631, + "train/contrastive_loss": 0.6630963087081909, + "train/negative_loss": 0.5745147466659546, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.08858159184455872, + "train/total_loss": 0.2754068672657013 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.17735347151756287, - "train/contrastive_loss": 1.772950530052185, - "train/negative_loss": 1.5978354215621948, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.17511510848999023, - "train/total_loss": 0.5319435596466064 + "train/classification_loss": 0.21467840671539307, + "train/contrastive_loss": 2.688988208770752, + "train/negative_loss": 2.3859636783599854, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.3030245006084442, + "train/total_loss": 0.7524760365486145 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.20716600120067596, - "train/contrastive_loss": 1.8318309783935547, - "train/negative_loss": 1.459362268447876, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.3724687397480011, - "train/total_loss": 0.573532223701477 + "train/classification_loss": 0.2218104600906372, + "train/contrastive_loss": 2.84360408782959, + "train/negative_loss": 1.8320857286453247, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 1.0115182399749756, + "train/total_loss": 0.7905312776565552 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.26938626170158386, - "train/contrastive_loss": 2.1318612098693848, - "train/negative_loss": 2.0514304637908936, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.08043073117733002, - "train/total_loss": 0.6957585215568542 + "train/classification_loss": 0.22064198553562164, + "train/contrastive_loss": 2.234194755554199, + "train/negative_loss": 1.4630733728408813, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.7711214423179626, + "train/total_loss": 0.6674809455871582 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.18177254498004913, - "train/contrastive_loss": 1.8001869916915894, - "train/negative_loss": 1.5574724674224854, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.24271447956562042, - "train/total_loss": 0.5418099761009216 + "train/classification_loss": 0.217738538980484, + "train/contrastive_loss": 0.8700132966041565, + "train/negative_loss": 0.8698275089263916, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 0.00018580493633635342, + "train/total_loss": 0.39174121618270874 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.1671236753463745, - "train/contrastive_loss": 2.048607587814331, - "train/negative_loss": 1.6759345531463623, + "train/classification_loss": 0.13523893058300018, + "train/contrastive_loss": 0.6919322609901428, + "train/negative_loss": 0.4435657262802124, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.37267303466796875, - "train/total_loss": 0.5768451690673828 + "train/positive_loss": 0.24836653470993042, + "train/total_loss": 0.27362537384033203 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.292933851480484, - "train/contrastive_loss": 3.2774548530578613, - "train/negative_loss": 2.258448839187622, + "train/classification_loss": 0.24660545587539673, + "train/contrastive_loss": 2.9734978675842285, + "train/negative_loss": 1.8433940410614014, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.0190060138702393, - "train/total_loss": 0.9484248161315918 + "train/num_positives": 14, + "train/positive_loss": 1.1301038265228271, + "train/total_loss": 0.8413050174713135 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.2054361253976822, - "train/contrastive_loss": 2.135164737701416, - "train/negative_loss": 1.8419955968856812, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.2931691110134125, - "train/total_loss": 0.6324690580368042 + "train/classification_loss": 0.18715506792068481, + "train/contrastive_loss": 2.116032123565674, + "train/negative_loss": 1.181221604347229, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.9348105192184448, + "train/total_loss": 0.6103614568710327 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.14833243191242218, - "train/contrastive_loss": 1.2633388042449951, - "train/negative_loss": 0.5886877775192261, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.674651026725769, - "train/total_loss": 0.4010002017021179 + "train/classification_loss": 0.20544745028018951, + "train/contrastive_loss": 1.607175588607788, + "train/negative_loss": 1.1987271308898926, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.4084485173225403, + "train/total_loss": 0.5268825888633728 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.248979851603508, - "train/contrastive_loss": 3.6900634765625, - "train/negative_loss": 2.228654623031616, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.4614089727401733, - "train/total_loss": 0.986992597579956 + "train/classification_loss": 0.22728942334651947, + "train/contrastive_loss": 3.931039810180664, + "train/negative_loss": 2.4261186122894287, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.5049210786819458, + "train/total_loss": 1.0134973526000977 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.15964797139167786, - "train/contrastive_loss": 1.1651129722595215, - "train/negative_loss": 1.1641379594802856, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.0009750400204211473, - "train/total_loss": 0.39267057180404663 + "train/classification_loss": 0.2303304374217987, + "train/contrastive_loss": 1.6849133968353271, + "train/negative_loss": 1.6026890277862549, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.08222441375255585, + "train/total_loss": 0.5673131346702576 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.1599956750869751, - "train/contrastive_loss": 1.9312505722045898, - "train/negative_loss": 1.6541595458984375, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.27709102630615234, - "train/total_loss": 0.546245813369751 + "train/classification_loss": 0.1550561934709549, + "train/contrastive_loss": 2.964245319366455, + "train/negative_loss": 0.9514899253845215, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 2.0127553939819336, + "train/total_loss": 0.7479052543640137 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.163163959980011, - "train/contrastive_loss": 0.8370791673660278, - "train/negative_loss": 0.6387070417404175, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.19837211072444916, - "train/total_loss": 0.33057981729507446 + "train/classification_loss": 0.2042667418718338, + "train/contrastive_loss": 2.0260186195373535, + "train/negative_loss": 1.2843199968338013, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.741698682308197, + "train/total_loss": 0.6094704866409302 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.2409946769475937, - "train/contrastive_loss": 3.006478786468506, - "train/negative_loss": 2.140543222427368, - "train/num_negatives": 40, + "train/classification_loss": 0.16754163801670074, + "train/contrastive_loss": 1.4737792015075684, + "train/negative_loss": 0.8898117542266846, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.8659354448318481, - "train/total_loss": 0.842290461063385 + "train/positive_loss": 0.5839675068855286, + "train/total_loss": 0.4622974991798401 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.21131537854671478, - "train/contrastive_loss": 1.1115062236785889, - "train/negative_loss": 0.47040891647338867, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.641097366809845, - "train/total_loss": 0.43361663818359375 + "train/classification_loss": 0.21145936846733093, + "train/contrastive_loss": 1.7176973819732666, + "train/negative_loss": 0.9128689765930176, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.8048284649848938, + "train/total_loss": 0.5549988746643066 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.22413836419582367, - "train/contrastive_loss": 2.1546149253845215, - "train/negative_loss": 1.6531447172164917, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.5014702081680298, - "train/total_loss": 0.6550613641738892 + "train/classification_loss": 0.20649760961532593, + "train/contrastive_loss": 0.8787757158279419, + "train/negative_loss": 0.3985722064971924, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.4802034795284271, + "train/total_loss": 0.3822527527809143 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.18086524307727814, - "train/contrastive_loss": 2.8034608364105225, - "train/negative_loss": 2.1243748664855957, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.679085910320282, - "train/total_loss": 0.7415574193000793 + "train/classification_loss": 0.19489778578281403, + "train/contrastive_loss": 3.086888313293457, + "train/negative_loss": 1.646887183189392, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.440001130104065, + "train/total_loss": 0.8122754693031311 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.2600420117378235, - "train/contrastive_loss": 2.16593599319458, - "train/negative_loss": 1.1975301504135132, - "train/num_negatives": 44, + "train/classification_loss": 0.16930510103702545, + "train/contrastive_loss": 1.041625738143921, + "train/negative_loss": 0.9929075241088867, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.9684059023857117, - "train/total_loss": 0.6932291984558105 + "train/positive_loss": 0.04871825501322746, + "train/total_loss": 0.37763023376464844 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.2614686191082001, - "train/contrastive_loss": 2.6197562217712402, - "train/negative_loss": 1.9190077781677246, - "train/num_negatives": 44, + "train/classification_loss": 0.14430966973304749, + "train/contrastive_loss": 2.8742356300354004, + "train/negative_loss": 1.8458573818206787, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.7007484436035156, - "train/total_loss": 0.7854198217391968 + "train/positive_loss": 1.0283783674240112, + "train/total_loss": 0.7191568613052368 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.15055491030216217, - "train/contrastive_loss": 1.1265367269515991, - "train/negative_loss": 0.6381794214248657, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.488357275724411, - "train/total_loss": 0.3758622407913208 + "train/classification_loss": 0.19273817539215088, + "train/contrastive_loss": 2.236297369003296, + "train/negative_loss": 1.3599917888641357, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.8763055801391602, + "train/total_loss": 0.639997661113739 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.15287110209465027, - "train/contrastive_loss": 0.9126694202423096, - "train/negative_loss": 0.2787471413612366, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.633922278881073, - "train/total_loss": 0.33540499210357666 + "train/classification_loss": 0.24937298893928528, + "train/contrastive_loss": 2.778104066848755, + "train/negative_loss": 1.426579236984253, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.351524829864502, + "train/total_loss": 0.8049938678741455 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.1351831704378128, - "train/contrastive_loss": 1.9774311780929565, - "train/negative_loss": 1.3963886499404907, + "train/classification_loss": 0.18907541036605835, + "train/contrastive_loss": 1.5253593921661377, + "train/negative_loss": 0.7853926420211792, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.5810425281524658, - "train/total_loss": 0.5306693911552429 + "train/num_positives": 10, + "train/positive_loss": 0.7399666905403137, + "train/total_loss": 0.49414730072021484 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.26803967356681824, - "train/contrastive_loss": 1.5272318124771118, - "train/negative_loss": 0.8430303931236267, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 0.6842014193534851, - "train/total_loss": 0.5734860301017761 + "train/classification_loss": 0.22384776175022125, + "train/contrastive_loss": 3.009986162185669, + "train/negative_loss": 1.789249300956726, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.2207368612289429, + "train/total_loss": 0.8258450031280518 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.27102479338645935, - "train/contrastive_loss": 3.1129093170166016, - "train/negative_loss": 1.4395638704299927, + "train/classification_loss": 0.2237471491098404, + "train/contrastive_loss": 1.8612817525863647, + "train/negative_loss": 1.8601264953613281, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.6733453273773193, - "train/total_loss": 0.8936066627502441 + "train/num_positives": 4, + "train/positive_loss": 0.0011552752694115043, + "train/total_loss": 0.596003532409668 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.2141820788383484, - "train/contrastive_loss": 2.9452402591705322, - "train/negative_loss": 2.6086409091949463, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.3365994095802307, - "train/total_loss": 0.8032301664352417 + "train/classification_loss": 0.20967324078083038, + "train/contrastive_loss": 0.21053670346736908, + "train/negative_loss": 0.19599571824073792, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.014540987089276314, + "train/total_loss": 0.25178056955337524 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.20600999891757965, - "train/contrastive_loss": 1.3836517333984375, - "train/negative_loss": 0.7732595801353455, - "train/num_negatives": 40, + "train/classification_loss": 0.25641560554504395, + "train/contrastive_loss": 2.2025504112243652, + "train/negative_loss": 1.0668914318084717, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.6103922128677368, - "train/total_loss": 0.4827403426170349 + "train/positive_loss": 1.135659098625183, + "train/total_loss": 0.696925699710846 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.23181456327438354, - "train/contrastive_loss": 1.7242013216018677, - "train/negative_loss": 1.5291553735733032, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.19504594802856445, - "train/total_loss": 0.5766547918319702 + "train/classification_loss": 0.23944158852100372, + "train/contrastive_loss": 1.1535974740982056, + "train/negative_loss": 1.1365643739700317, + "train/num_negatives": 38, + "train/num_positives": 10, + "train/positive_loss": 0.017033154144883156, + "train/total_loss": 0.4701610803604126 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.17067471146583557, - "train/contrastive_loss": 1.3714947700500488, - "train/negative_loss": 0.778760552406311, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.5927342772483826, - "train/total_loss": 0.4449736773967743 + "train/classification_loss": 0.16724729537963867, + "train/contrastive_loss": 1.302540898323059, + "train/negative_loss": 1.3008681535720825, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.0016727934125810862, + "train/total_loss": 0.4277554750442505 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.24365724623203278, - "train/contrastive_loss": 1.9125930070877075, - "train/negative_loss": 1.1724003553390503, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.7401926517486572, - "train/total_loss": 0.6261758804321289 + "train/classification_loss": 0.1996653825044632, + "train/contrastive_loss": 3.8614325523376465, + "train/negative_loss": 2.305530548095703, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.5559020042419434, + "train/total_loss": 0.9719519019126892 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.25836262106895447, - "train/contrastive_loss": 1.0988633632659912, - "train/negative_loss": 1.0981329679489136, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0007303639431484044, - "train/total_loss": 0.47813528776168823 + "train/classification_loss": 0.21217036247253418, + "train/contrastive_loss": 2.384697437286377, + "train/negative_loss": 0.9175740480422974, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.4671235084533691, + "train/total_loss": 0.6891098618507385 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.21884332597255707, - "train/contrastive_loss": 1.8757169246673584, - "train/negative_loss": 1.3165854215621948, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.5591315031051636, - "train/total_loss": 0.5939866900444031 + "train/classification_loss": 0.2223367691040039, + "train/contrastive_loss": 2.0807347297668457, + "train/negative_loss": 1.5713911056518555, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.5093435645103455, + "train/total_loss": 0.6384837627410889 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.214738130569458, - "train/contrastive_loss": 2.971015453338623, - "train/negative_loss": 2.127578020095825, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.8434373736381531, - "train/total_loss": 0.8089412450790405 + "train/classification_loss": 0.25095394253730774, + "train/contrastive_loss": 3.321063995361328, + "train/negative_loss": 1.9911603927612305, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 1.329903483390808, + "train/total_loss": 0.9151667356491089 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.1829337328672409, - "train/contrastive_loss": 3.6934814453125, - "train/negative_loss": 1.5756124258041382, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 2.1178691387176514, - "train/total_loss": 0.9216300249099731 + "train/classification_loss": 0.1524108201265335, + "train/contrastive_loss": 2.1531994342803955, + "train/negative_loss": 2.153045177459717, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.0001543389807920903, + "train/total_loss": 0.5830507278442383 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.18691465258598328, - "train/contrastive_loss": 1.6776552200317383, - "train/negative_loss": 1.2855075597763062, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.3921476900577545, - "train/total_loss": 0.5224456787109375 + "train/classification_loss": 0.21389931440353394, + "train/contrastive_loss": 1.0181796550750732, + "train/negative_loss": 0.6149943470954895, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 0.40318524837493896, + "train/total_loss": 0.4175352454185486 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.20408523082733154, - "train/contrastive_loss": 1.3487032651901245, - "train/negative_loss": 1.2983390092849731, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.050364281982183456, - "train/total_loss": 0.4738259017467499 + "train/classification_loss": 0.27000924944877625, + "train/contrastive_loss": 2.7042622566223145, + "train/negative_loss": 2.2667722702026367, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.43748992681503296, + "train/total_loss": 0.8108617067337036 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.22791829705238342, - "train/contrastive_loss": 1.8635659217834473, - "train/negative_loss": 1.7879486083984375, - "train/num_negatives": 46, + "train/classification_loss": 0.21009594202041626, + "train/contrastive_loss": 0.4851546883583069, + "train/negative_loss": 0.38059118390083313, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.10456349700689316, + "train/total_loss": 0.30712687969207764 + }, + { + "epoch": 5.28169014084507, + "step": 1500, + "train/classification_loss": 0.2787434160709381, + "train/contrastive_loss": 3.513895034790039, + "train/negative_loss": 2.2333409786224365, + "train/num_negatives": 42, "train/num_positives": 8, - "train/positive_loss": 0.07561735808849335, - "train/total_loss": 0.6006314754486084 + "train/positive_loss": 1.280554175376892, + "train/total_loss": 0.9815224409103394 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.20144492387771606, - "train/contrastive_loss": 1.9024699926376343, - "train/negative_loss": 1.8620316982269287, + "train/classification_loss": 0.15372511744499207, + "train/contrastive_loss": 1.4948574304580688, + "train/negative_loss": 0.8530688285827637, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.04043826088309288, - "train/total_loss": 0.5819389224052429 + "train/num_positives": 10, + "train/positive_loss": 0.6417886018753052, + "train/total_loss": 0.45269662141799927 + }, + { + "epoch": 5.28169014084507, + "step": 1500, + "train/classification_loss": 0.1950065940618515, + "train/contrastive_loss": 3.4712212085723877, + "train/negative_loss": 2.2971549034118652, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 1.1740663051605225, + "train/total_loss": 0.8892508745193481 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.18482808768749237, - "train/contrastive_loss": 0.8901057243347168, - "train/negative_loss": 0.7888711094856262, + "train/classification_loss": 0.21279451251029968, + "train/contrastive_loss": 1.0096569061279297, + "train/negative_loss": 1.0092675685882568, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.0003893813118338585, + "train/total_loss": 0.4147258996963501 + }, + { + "epoch": 5.28169014084507, + "step": 1500, + "train/classification_loss": 0.2675437331199646, + "train/contrastive_loss": 1.8837124109268188, + "train/negative_loss": 1.8820476531982422, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.10123460739850998, - "train/total_loss": 0.36284923553466797 + "train/positive_loss": 0.0016647394513711333, + "train/total_loss": 0.6442862153053284 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.2074083834886551, - "train/contrastive_loss": 2.2853479385375977, - "train/negative_loss": 2.0549991130828857, - "train/num_negatives": 36, + "train/classification_loss": 0.21745339035987854, + "train/contrastive_loss": 0.950171172618866, + "train/negative_loss": 0.6876944899559021, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.26247668266296387, + "train/total_loss": 0.4074876308441162 + }, + { + "epoch": 5.28169014084507, + "step": 1500, + "train/classification_loss": 0.3117443025112152, + "train/contrastive_loss": 2.8014614582061768, + "train/negative_loss": 2.127279043197632, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.23034892976284027, - "train/total_loss": 0.6644780039787292 + "train/positive_loss": 0.6741823554039001, + "train/total_loss": 0.8720365762710571 + }, + { + "epoch": 5.28169014084507, + "step": 1500, + "train/classification_loss": 0.17777502536773682, + "train/contrastive_loss": 1.4357764720916748, + "train/negative_loss": 1.0680173635482788, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.36775916814804077, + "train/total_loss": 0.46493032574653625 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.24222570657730103, - "train/contrastive_loss": 1.028113603591919, - "train/negative_loss": 0.4427121579647064, + "train/classification_loss": 0.22267363965511322, + "train/contrastive_loss": 2.5921692848205566, + "train/negative_loss": 1.7946677207946777, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.5854014754295349, - "train/total_loss": 0.44784843921661377 + "train/num_positives": 14, + "train/positive_loss": 0.7975016236305237, + "train/total_loss": 0.7411075234413147 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.18792380392551422, - "train/contrastive_loss": 2.233563184738159, - "train/negative_loss": 1.5940258502960205, + "train/classification_loss": 0.2684362232685089, + "train/contrastive_loss": 2.321204900741577, + "train/negative_loss": 2.321115493774414, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.6395372748374939, - "train/total_loss": 0.6346364617347717 + "train/num_positives": 2, + "train/positive_loss": 8.929174509830773e-05, + "train/total_loss": 0.7326772212982178 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.16255562007427216, - "train/contrastive_loss": 1.7516610622406006, - "train/negative_loss": 1.1576484441757202, + "train/classification_loss": 0.19712282717227936, + "train/contrastive_loss": 2.233785390853882, + "train/negative_loss": 1.603864312171936, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.5940126180648804, - "train/total_loss": 0.5128878355026245 + "train/num_positives": 16, + "train/positive_loss": 0.629921019077301, + "train/total_loss": 0.6438798904418945 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.2775709927082062, - "train/contrastive_loss": 1.8695780038833618, - "train/negative_loss": 1.8563990592956543, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.013178929686546326, - "train/total_loss": 0.6514866352081299 + "train/classification_loss": 0.1858803778886795, + "train/contrastive_loss": 0.6894663572311401, + "train/negative_loss": 0.44342461228370667, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.24604175984859467, + "train/total_loss": 0.32377365231513977 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.14470866322517395, - "train/contrastive_loss": 1.1293716430664062, - "train/negative_loss": 1.1266734600067139, - "train/num_negatives": 48, + "train/classification_loss": 0.24126358330249786, + "train/contrastive_loss": 0.5397908091545105, + "train/negative_loss": 0.47343602776527405, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 0.0026982089038938284, - "train/total_loss": 0.3705829977989197 + "train/positive_loss": 0.06635475903749466, + "train/total_loss": 0.34922173619270325 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.17150087654590607, - "train/contrastive_loss": 0.7085525989532471, - "train/negative_loss": 0.22313492000102997, + "train/classification_loss": 0.22538423538208008, + "train/contrastive_loss": 1.0500423908233643, + "train/negative_loss": 0.770239531993866, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.4854176640510559, - "train/total_loss": 0.3132113814353943 + "train/num_positives": 14, + "train/positive_loss": 0.2798028886318207, + "train/total_loss": 0.43539273738861084 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.14805036783218384, - "train/contrastive_loss": 0.6224093437194824, - "train/negative_loss": 0.5918495655059814, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.030559783801436424, - "train/total_loss": 0.27253222465515137 + "train/classification_loss": 0.3079920709133148, + "train/contrastive_loss": 1.9762444496154785, + "train/negative_loss": 1.3747068643569946, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 0.6015375256538391, + "train/total_loss": 0.7032409906387329 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.21981260180473328, - "train/contrastive_loss": 0.695090651512146, - "train/negative_loss": 0.4862945079803467, - "train/num_negatives": 28, + "train/classification_loss": 0.1529608517885208, + "train/contrastive_loss": 0.5382075905799866, + "train/negative_loss": 0.5331097841262817, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.20879612863063812, - "train/total_loss": 0.3588307499885559 + "train/positive_loss": 0.005097777582705021, + "train/total_loss": 0.26060235500335693 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.19312843680381775, - "train/contrastive_loss": 1.9793723821640015, - "train/negative_loss": 0.8770608901977539, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.1023114919662476, - "train/total_loss": 0.5890029072761536 + "train/classification_loss": 0.1508939117193222, + "train/contrastive_loss": 0.7440985441207886, + "train/negative_loss": 0.2530116140842438, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.4910869300365448, + "train/total_loss": 0.2997136116027832 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.18536293506622314, - "train/contrastive_loss": 1.05420982837677, - "train/negative_loss": 0.9447280168533325, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.1094818115234375, - "train/total_loss": 0.3962048888206482 + "train/classification_loss": 0.1866835653781891, + "train/contrastive_loss": 0.9746546745300293, + "train/negative_loss": 0.906044602394104, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.0686100572347641, + "train/total_loss": 0.3816145062446594 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.2108427733182907, - "train/contrastive_loss": 3.157905101776123, - "train/negative_loss": 1.1135808229446411, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 2.0443243980407715, - "train/total_loss": 0.8424237966537476 + "train/classification_loss": 0.2201661467552185, + "train/contrastive_loss": 2.9372711181640625, + "train/negative_loss": 1.0342472791671753, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.9030237197875977, + "train/total_loss": 0.8076204061508179 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.23744668066501617, - "train/contrastive_loss": 2.583112955093384, - "train/negative_loss": 1.4942703247070312, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.0888426303863525, - "train/total_loss": 0.7540692687034607 + "train/classification_loss": 0.22550223767757416, + "train/contrastive_loss": 1.3420944213867188, + "train/negative_loss": 1.223663568496704, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.11843083798885345, + "train/total_loss": 0.49392110109329224 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.18903079628944397, - "train/contrastive_loss": 0.8778753280639648, - "train/negative_loss": 0.43684282898902893, + "train/classification_loss": 0.15391422808170319, + "train/contrastive_loss": 0.3427361845970154, + "train/negative_loss": 0.18869996070861816, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.4410324990749359, - "train/total_loss": 0.3646058440208435 + "train/num_positives": 16, + "train/positive_loss": 0.15403620898723602, + "train/total_loss": 0.22246146202087402 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.18006089329719543, - "train/contrastive_loss": 2.627274513244629, - "train/negative_loss": 1.6210675239562988, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.00620698928833, - "train/total_loss": 0.7055158615112305 + "train/classification_loss": 0.20097817480564117, + "train/contrastive_loss": 2.4801955223083496, + "train/negative_loss": 1.040342926979065, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 1.4398527145385742, + "train/total_loss": 0.6970173120498657 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.250312477350235, - "train/contrastive_loss": 2.930715799331665, - "train/negative_loss": 1.3351229429244995, + "train/classification_loss": 0.2750329375267029, + "train/contrastive_loss": 2.6431326866149902, + "train/negative_loss": 2.556562662124634, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.5955928564071655, - "train/total_loss": 0.8364557027816772 + "train/num_positives": 2, + "train/positive_loss": 0.0865701362490654, + "train/total_loss": 0.8036594986915588 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.2157830148935318, - "train/contrastive_loss": 1.3912602663040161, - "train/negative_loss": 1.0858333110809326, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.3054269850254059, - "train/total_loss": 0.4940350651741028 + "train/classification_loss": 0.16166841983795166, + "train/contrastive_loss": 3.3219175338745117, + "train/negative_loss": 1.5956919193267822, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.726225733757019, + "train/total_loss": 0.8260519504547119 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.21217362582683563, - "train/contrastive_loss": 3.0415380001068115, - "train/negative_loss": 1.9323755502700806, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.109162449836731, - "train/total_loss": 0.8204812407493591 + "train/classification_loss": 0.22442971169948578, + "train/contrastive_loss": 1.8916311264038086, + "train/negative_loss": 1.7948410511016846, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.09679010510444641, + "train/total_loss": 0.6027559638023376 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.21574124693870544, - "train/contrastive_loss": 2.642425060272217, - "train/negative_loss": 1.6951442956924438, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.9472807049751282, - "train/total_loss": 0.7442262172698975 + "train/classification_loss": 0.21694506704807281, + "train/contrastive_loss": 1.2165296077728271, + "train/negative_loss": 0.7232502102851868, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 0.4932793378829956, + "train/total_loss": 0.46025097370147705 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.2439928650856018, - "train/contrastive_loss": 3.378657341003418, - "train/negative_loss": 2.68117618560791, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.697481095790863, - "train/total_loss": 0.9197243452072144 + "train/classification_loss": 0.20899632573127747, + "train/contrastive_loss": 5.260756969451904, + "train/negative_loss": 5.260749816894531, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 7.224129603855545e-06, + "train/total_loss": 1.2611477375030518 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.24362020194530487, - "train/contrastive_loss": 2.4703893661499023, - "train/negative_loss": 1.8761485815048218, + "train/classification_loss": 0.20686830580234528, + "train/contrastive_loss": 0.7166347503662109, + "train/negative_loss": 0.3884955048561096, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.5942407846450806, - "train/total_loss": 0.7376980781555176 + "train/positive_loss": 0.3281392753124237, + "train/total_loss": 0.3501952588558197 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.20744740962982178, - "train/contrastive_loss": 0.950239896774292, - "train/negative_loss": 0.9495099782943726, + "train/classification_loss": 0.2344495803117752, + "train/contrastive_loss": 2.4842820167541504, + "train/negative_loss": 1.4722728729248047, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.0007299109129235148, - "train/total_loss": 0.3974953889846802 + "train/num_positives": 8, + "train/positive_loss": 1.0120090246200562, + "train/total_loss": 0.7313060164451599 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.1762300729751587, - "train/contrastive_loss": 1.1651244163513184, - "train/negative_loss": 0.776850700378418, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.3882737159729004, - "train/total_loss": 0.4092549681663513 + "train/classification_loss": 0.17630720138549805, + "train/contrastive_loss": 2.585228204727173, + "train/negative_loss": 1.4172074794769287, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.1680207252502441, + "train/total_loss": 0.6933528780937195 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.1966848224401474, - "train/contrastive_loss": 1.3103623390197754, - "train/negative_loss": 0.9152129888534546, - "train/num_negatives": 46, + "train/classification_loss": 0.26748135685920715, + "train/contrastive_loss": 2.0368354320526123, + "train/negative_loss": 1.9325711727142334, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.3951493501663208, - "train/total_loss": 0.45875728130340576 + "train/positive_loss": 0.1042642742395401, + "train/total_loss": 0.6748484373092651 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.2556271255016327, - "train/contrastive_loss": 1.6118662357330322, - "train/negative_loss": 1.6118662357330322, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5780003666877747 - }, - { - "epoch": 5.7034220532319395, - "eval_exact_match_accuracy": 0.19428571428571428, - "eval_hamming_loss": 0.07708683473389356, - "eval_loss": 0.5976338386535645, - "eval_macro_f1": 0.13741040679934885, - "eval_macro_precision": 0.3013222936233317, - "eval_macro_recall": 0.10346686647569328, - "eval_micro_f1": 0.41196581196581195, - "eval_micro_precision": 0.8281786941580757, - "eval_micro_recall": 0.27417519908987487, - "eval_runtime": 2.6296, - "eval_samples_per_second": 199.649, - "eval_steps_per_second": 25.099, + "train/classification_loss": 0.20691922307014465, + "train/contrastive_loss": 0.979591429233551, + "train/negative_loss": 0.8532407879829407, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.12635065615177155, + "train/total_loss": 0.40283751487731934 + }, + { + "epoch": 5.28169014084507, + "eval_exact_match_accuracy": 0.2239858906525573, + "eval_hamming_loss": 0.07262164124909223, + "eval_loss": 0.6040080785751343, + "eval_macro_f1": 0.19772493885278988, + "eval_macro_precision": 0.3197474920333325, + "eval_macro_recall": 0.15588829677088895, + "eval_micro_f1": 0.45054945054945056, + "eval_micro_precision": 0.8541666666666666, + "eval_micro_recall": 0.30597014925373134, + "eval_runtime": 2.8406, + "eval_samples_per_second": 199.605, + "eval_steps_per_second": 24.995, "step": 1500 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.24454966187477112, - "train/contrastive_loss": 1.3606679439544678, - "train/negative_loss": 1.3178895711898804, + "train/classification_loss": 0.21017411351203918, + "train/contrastive_loss": 1.1640411615371704, + "train/negative_loss": 0.8045998811721802, "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.04277839884161949, - "train/total_loss": 0.5166832208633423 + "train/num_positives": 10, + "train/positive_loss": 0.35944128036499023, + "train/total_loss": 0.44298234581947327 }, { - "epoch": 5.7034220532319395, + "epoch": 5.28169014084507, "step": 1500, - "train/classification_loss": 0.14403048157691956, - "train/contrastive_loss": 0.8303778767585754, - "train/negative_loss": 0.585578441619873, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.2447994500398636, - "train/total_loss": 0.3101060390472412 + "train/classification_loss": 0.21734820306301117, + "train/contrastive_loss": 0.6913052201271057, + "train/negative_loss": 0.6011077761650085, + "train/num_negatives": 36, + "train/num_positives": 16, + "train/positive_loss": 0.09019742906093597, + "train/total_loss": 0.3556092381477356 }, { - "epoch": 5.893536121673003, - "grad_norm": 10.709308624267578, - "learning_rate": 1.9779756468797567e-05, - "loss": 0.8632, + "epoch": 5.457746478873239, + "grad_norm": 11.561055183410645, + "learning_rate": 1.9796194503171248e-05, + "loss": 0.8382, "step": 1550 }, { - "epoch": 5.893536121673003, + "epoch": 5.457746478873239, "step": 1550, - "train/classification_loss": 0.2201460599899292, - "train/contrastive_loss": 1.2947051525115967, - "train/negative_loss": 0.7099259495735168, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.5847792625427246, - "train/total_loss": 0.47908708453178406 + "train/classification_loss": 0.22216124832630157, + "train/contrastive_loss": 1.2040032148361206, + "train/negative_loss": 0.7773630023002625, + "train/num_negatives": 24, + "train/num_positives": 18, + "train/positive_loss": 0.42664018273353577, + "train/total_loss": 0.46296191215515137 }, { - "epoch": 5.893536121673003, + "epoch": 5.457746478873239, "step": 1550, - "train/classification_loss": 0.27261024713516235, - "train/contrastive_loss": 2.0624051094055176, - "train/negative_loss": 1.3653761148452759, - "train/num_negatives": 36, - "train/num_positives": 10, - "train/positive_loss": 0.6970290541648865, - "train/total_loss": 0.6850912570953369 + "train/classification_loss": 0.25321558117866516, + "train/contrastive_loss": 1.0504286289215088, + "train/negative_loss": 0.7849107980728149, + "train/num_negatives": 46, + "train/num_positives": 2, + "train/positive_loss": 0.2655177712440491, + "train/total_loss": 0.46330130100250244 }, { - "epoch": 6.083650190114068, - "grad_norm": 21.121591567993164, - "learning_rate": 1.9772146118721462e-05, - "loss": 0.8554, + "epoch": 5.633802816901408, + "grad_norm": 16.24932861328125, + "learning_rate": 1.9789147286821706e-05, + "loss": 0.8582, "step": 1600 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.2679643929004669, - "train/contrastive_loss": 1.8381534814834595, - "train/negative_loss": 1.1142867803573608, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.7238667011260986, - "train/total_loss": 0.6355950832366943 + "train/classification_loss": 0.23702077567577362, + "train/contrastive_loss": 1.6451088190078735, + "train/negative_loss": 1.5508790016174316, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.09422986209392548, + "train/total_loss": 0.5660425424575806 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.23385880887508392, - "train/contrastive_loss": 2.204223871231079, - "train/negative_loss": 1.0108118057250977, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 1.1934120655059814, - "train/total_loss": 0.6747035980224609 + "train/classification_loss": 0.2807944416999817, + "train/contrastive_loss": 1.4290659427642822, + "train/negative_loss": 0.5341874361038208, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.8948785662651062, + "train/total_loss": 0.5666075944900513 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.17987164855003357, - "train/contrastive_loss": 2.2157654762268066, - "train/negative_loss": 1.377975583076477, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.8377898335456848, - "train/total_loss": 0.6230247616767883 + "train/classification_loss": 0.2671695053577423, + "train/contrastive_loss": 2.3894972801208496, + "train/negative_loss": 1.2943984270095825, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.0950989723205566, + "train/total_loss": 0.7450689673423767 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.19711458683013916, - "train/contrastive_loss": 2.6370697021484375, - "train/negative_loss": 1.3420010805130005, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.2950685024261475, - "train/total_loss": 0.7245285511016846 + "train/classification_loss": 0.13481146097183228, + "train/contrastive_loss": 0.5420774221420288, + "train/negative_loss": 0.48649072647094727, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.055586669594049454, + "train/total_loss": 0.24322694540023804 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.17512686550617218, - "train/contrastive_loss": 2.0600128173828125, - "train/negative_loss": 1.9748681783676147, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.0851445198059082, - "train/total_loss": 0.5871294140815735 + "train/classification_loss": 0.21328222751617432, + "train/contrastive_loss": 2.6036579608917236, + "train/negative_loss": 2.0069971084594727, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.596660852432251, + "train/total_loss": 0.7340138554573059 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.18789641559123993, - "train/contrastive_loss": 1.748475193977356, - "train/negative_loss": 1.2833327054977417, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.46514245867729187, - "train/total_loss": 0.5375914573669434 + "train/classification_loss": 0.21861054003238678, + "train/contrastive_loss": 2.874683141708374, + "train/negative_loss": 1.37449312210083, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 1.500190019607544, + "train/total_loss": 0.7935471534729004 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.2543294131755829, - "train/contrastive_loss": 1.605653166770935, - "train/negative_loss": 1.5085455179214478, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.09710760414600372, - "train/total_loss": 0.5754600763320923 + "train/classification_loss": 0.2072199136018753, + "train/contrastive_loss": 2.2234437465667725, + "train/negative_loss": 1.3584762811660767, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.864967405796051, + "train/total_loss": 0.6519086956977844 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.16750293970108032, - "train/contrastive_loss": 1.4402375221252441, - "train/negative_loss": 1.2404251098632812, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.19981247186660767, - "train/total_loss": 0.4555504620075226 + "train/classification_loss": 0.2144571840763092, + "train/contrastive_loss": 0.7091529369354248, + "train/negative_loss": 0.7090263366699219, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 0.00012660828360822052, + "train/total_loss": 0.35628777742385864 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.162539541721344, - "train/contrastive_loss": 2.043846607208252, - "train/negative_loss": 1.5438417196273804, + "train/classification_loss": 0.1336527317762375, + "train/contrastive_loss": 1.205674409866333, + "train/negative_loss": 0.4180910587310791, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.5000048875808716, - "train/total_loss": 0.5713088512420654 + "train/positive_loss": 0.7875833511352539, + "train/total_loss": 0.3747876286506653 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.3157876431941986, - "train/contrastive_loss": 3.13435435295105, - "train/negative_loss": 1.3429925441741943, + "train/classification_loss": 0.22610506415367126, + "train/contrastive_loss": 3.4279775619506836, + "train/negative_loss": 1.413112998008728, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.7913618087768555, - "train/total_loss": 0.942658543586731 + "train/num_positives": 14, + "train/positive_loss": 2.014864683151245, + "train/total_loss": 0.9117006063461304 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.20163027942180634, - "train/contrastive_loss": 2.174553394317627, - "train/negative_loss": 1.7564562559127808, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.4180970788002014, - "train/total_loss": 0.636540949344635 + "train/classification_loss": 0.1818275898694992, + "train/contrastive_loss": 2.3474843502044678, + "train/negative_loss": 1.0960769653320312, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 1.2514073848724365, + "train/total_loss": 0.651324450969696 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.14368033409118652, - "train/contrastive_loss": 1.1645299196243286, - "train/negative_loss": 0.7936394810676575, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.37089043855667114, - "train/total_loss": 0.37658631801605225 + "train/classification_loss": 0.19788329303264618, + "train/contrastive_loss": 0.7274901866912842, + "train/negative_loss": 0.726530909538269, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.0009592588758096099, + "train/total_loss": 0.3433813452720642 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.25359514355659485, - "train/contrastive_loss": 4.021892547607422, - "train/negative_loss": 2.040065288543701, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.9818270206451416, - "train/total_loss": 1.0579736232757568 + "train/classification_loss": 0.22228887677192688, + "train/contrastive_loss": 3.467336654663086, + "train/negative_loss": 2.3886945247650146, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.0786421298980713, + "train/total_loss": 0.9157562255859375 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.1497087925672531, - "train/contrastive_loss": 1.94059157371521, - "train/negative_loss": 1.935733437538147, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.004858182743191719, - "train/total_loss": 0.5378271341323853 + "train/classification_loss": 0.22804833948612213, + "train/contrastive_loss": 1.145745038986206, + "train/negative_loss": 1.0951086282730103, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.0506364107131958, + "train/total_loss": 0.457197368144989 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.1534537374973297, - "train/contrastive_loss": 2.7932376861572266, - "train/negative_loss": 1.7487716674804688, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.0444658994674683, - "train/total_loss": 0.7121013402938843 + "train/classification_loss": 0.15663203597068787, + "train/contrastive_loss": 3.1898193359375, + "train/negative_loss": 0.8811120390892029, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 2.3087072372436523, + "train/total_loss": 0.7945959568023682 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.1770736128091812, - "train/contrastive_loss": 1.2004387378692627, - "train/negative_loss": 0.7053658962249756, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.4950728416442871, - "train/total_loss": 0.41716134548187256 + "train/classification_loss": 0.20080019533634186, + "train/contrastive_loss": 2.1944327354431152, + "train/negative_loss": 1.15549635887146, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 1.0389363765716553, + "train/total_loss": 0.6396867632865906 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.2290739119052887, - "train/contrastive_loss": 2.676208734512329, - "train/negative_loss": 1.6983184814453125, - "train/num_negatives": 40, + "train/classification_loss": 0.16196012496948242, + "train/contrastive_loss": 1.927802324295044, + "train/negative_loss": 1.0773741006851196, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.9778903126716614, - "train/total_loss": 0.7643157243728638 + "train/positive_loss": 0.8504282236099243, + "train/total_loss": 0.547520637512207 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.20198047161102295, - "train/contrastive_loss": 1.2813485860824585, - "train/negative_loss": 0.3662380576133728, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.9151105284690857, - "train/total_loss": 0.4582501947879791 + "train/classification_loss": 0.20059916377067566, + "train/contrastive_loss": 1.8498501777648926, + "train/negative_loss": 1.4267992973327637, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.4230509400367737, + "train/total_loss": 0.5705692172050476 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.21460647881031036, - "train/contrastive_loss": 2.1343436241149902, - "train/negative_loss": 1.4756584167480469, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.6586852073669434, - "train/total_loss": 0.6414752006530762 + "train/classification_loss": 0.19621223211288452, + "train/contrastive_loss": 0.8714191913604736, + "train/negative_loss": 0.5153063535690308, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.3561128079891205, + "train/total_loss": 0.37049609422683716 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.17162634432315826, - "train/contrastive_loss": 2.854593276977539, - "train/negative_loss": 1.4962608814239502, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.3583325147628784, - "train/total_loss": 0.7425450086593628 + "train/classification_loss": 0.19108864665031433, + "train/contrastive_loss": 2.732180595397949, + "train/negative_loss": 1.5897300243377686, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.1424506902694702, + "train/total_loss": 0.7375247478485107 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.26532667875289917, - "train/contrastive_loss": 1.9233779907226562, - "train/negative_loss": 0.9441226720809937, - "train/num_negatives": 44, + "train/classification_loss": 0.16884231567382812, + "train/contrastive_loss": 0.8711749911308289, + "train/negative_loss": 0.8151357769966125, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.9792553186416626, - "train/total_loss": 0.6500022411346436 + "train/positive_loss": 0.05603921413421631, + "train/total_loss": 0.34307730197906494 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.261185884475708, - "train/contrastive_loss": 1.988071322441101, - "train/negative_loss": 1.1545206308364868, - "train/num_negatives": 44, + "train/classification_loss": 0.14346754550933838, + "train/contrastive_loss": 3.257957696914673, + "train/negative_loss": 2.0725789070129395, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.8335506916046143, - "train/total_loss": 0.6588001251220703 + "train/positive_loss": 1.1853787899017334, + "train/total_loss": 0.795059084892273 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.15181080996990204, - "train/contrastive_loss": 1.1287256479263306, - "train/negative_loss": 0.3970555067062378, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.7316701412200928, - "train/total_loss": 0.3775559365749359 + "train/classification_loss": 0.18945926427841187, + "train/contrastive_loss": 2.7343173027038574, + "train/negative_loss": 0.8981912136077881, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 1.8361260890960693, + "train/total_loss": 0.7363227605819702 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.15016572177410126, - "train/contrastive_loss": 0.9951174855232239, - "train/negative_loss": 0.529775857925415, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.46534162759780884, - "train/total_loss": 0.34918922185897827 + "train/classification_loss": 0.24139651656150818, + "train/contrastive_loss": 2.6334381103515625, + "train/negative_loss": 1.2412890195846558, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.3921489715576172, + "train/total_loss": 0.7680841684341431 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.12308923155069351, - "train/contrastive_loss": 1.0362533330917358, - "train/negative_loss": 0.8582270741462708, + "train/classification_loss": 0.19805581867694855, + "train/contrastive_loss": 2.717120885848999, + "train/negative_loss": 0.8351744413375854, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.17802630364894867, - "train/total_loss": 0.3303399085998535 + "train/num_positives": 10, + "train/positive_loss": 1.8819464445114136, + "train/total_loss": 0.7414799928665161 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.2635440230369568, - "train/contrastive_loss": 2.24818754196167, - "train/negative_loss": 0.8995246887207031, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.3486628532409668, - "train/total_loss": 0.7131814956665039 + "train/classification_loss": 0.22040274739265442, + "train/contrastive_loss": 2.877885580062866, + "train/negative_loss": 2.0133190155029297, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.8645665645599365, + "train/total_loss": 0.7959798574447632 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.2603808045387268, - "train/contrastive_loss": 2.736421585083008, - "train/negative_loss": 1.6207841634750366, + "train/classification_loss": 0.21370400488376617, + "train/contrastive_loss": 1.2733008861541748, + "train/negative_loss": 1.272513508796692, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.1156375408172607, - "train/total_loss": 0.8076651096343994 + "train/num_positives": 4, + "train/positive_loss": 0.0007874318398535252, + "train/total_loss": 0.4683641791343689 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.19829650223255157, - "train/contrastive_loss": 2.594700336456299, - "train/negative_loss": 1.9730260372161865, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.6216744184494019, - "train/total_loss": 0.7172365784645081 + "train/classification_loss": 0.20344698429107666, + "train/contrastive_loss": 0.1555728167295456, + "train/negative_loss": 0.143561452627182, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.01201136689633131, + "train/total_loss": 0.23456154763698578 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.21623510122299194, - "train/contrastive_loss": 0.9760452508926392, - "train/negative_loss": 0.5375193953514099, - "train/num_negatives": 40, + "train/classification_loss": 0.25167909264564514, + "train/contrastive_loss": 3.0801098346710205, + "train/negative_loss": 1.464032769203186, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.43852582573890686, - "train/total_loss": 0.41144415736198425 + "train/positive_loss": 1.6160770654678345, + "train/total_loss": 0.8677010536193848 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.2245519608259201, - "train/contrastive_loss": 1.9598215818405151, - "train/negative_loss": 1.5187116861343384, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.44110989570617676, - "train/total_loss": 0.6165162920951843 + "train/classification_loss": 0.22584731876850128, + "train/contrastive_loss": 0.5820425152778625, + "train/negative_loss": 0.4849640727043152, + "train/num_negatives": 38, + "train/num_positives": 10, + "train/positive_loss": 0.09707845747470856, + "train/total_loss": 0.3422558307647705 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.16235777735710144, - "train/contrastive_loss": 1.2126485109329224, - "train/negative_loss": 0.6543004512786865, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.5583480596542358, - "train/total_loss": 0.40488749742507935 + "train/classification_loss": 0.165061816573143, + "train/contrastive_loss": 0.9276313781738281, + "train/negative_loss": 0.9270414113998413, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.0005899504176340997, + "train/total_loss": 0.3505880832672119 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.2475735992193222, - "train/contrastive_loss": 4.001089096069336, - "train/negative_loss": 2.614267110824585, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.38682222366333, - "train/total_loss": 1.0477913618087769 + "train/classification_loss": 0.19334378838539124, + "train/contrastive_loss": 3.6510744094848633, + "train/negative_loss": 1.8619177341461182, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.7891566753387451, + "train/total_loss": 0.9235587120056152 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.23644746840000153, - "train/contrastive_loss": 0.5684397220611572, - "train/negative_loss": 0.5679696798324585, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.000470033468445763, - "train/total_loss": 0.3501354157924652 + "train/classification_loss": 0.2063838392496109, + "train/contrastive_loss": 2.273486614227295, + "train/negative_loss": 1.0990484952926636, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.174438238143921, + "train/total_loss": 0.6610811948776245 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.21233730018138885, - "train/contrastive_loss": 2.308206796646118, - "train/negative_loss": 1.1177703142166138, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 1.1904364824295044, - "train/total_loss": 0.6739786863327026 + "train/classification_loss": 0.22358667850494385, + "train/contrastive_loss": 1.647292137145996, + "train/negative_loss": 1.556389570236206, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.09090255945920944, + "train/total_loss": 0.5530451536178589 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.20101593434810638, - "train/contrastive_loss": 2.5706541538238525, - "train/negative_loss": 2.0885767936706543, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.482077419757843, - "train/total_loss": 0.7151467800140381 + "train/classification_loss": 0.24036137759685516, + "train/contrastive_loss": 2.812830924987793, + "train/negative_loss": 1.8549643754959106, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.9578665494918823, + "train/total_loss": 0.8029276132583618 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.18069371581077576, - "train/contrastive_loss": 3.3847122192382812, - "train/negative_loss": 1.5385546684265137, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.8461576700210571, - "train/total_loss": 0.8576362133026123 + "train/classification_loss": 0.15133407711982727, + "train/contrastive_loss": 1.9341228008270264, + "train/negative_loss": 1.9336551427841187, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.0004676328389905393, + "train/total_loss": 0.538158655166626 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.1821729838848114, - "train/contrastive_loss": 1.2910757064819336, - "train/negative_loss": 0.7821313142776489, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.5089443922042847, - "train/total_loss": 0.44038814306259155 + "train/classification_loss": 0.2138678878545761, + "train/contrastive_loss": 0.9629563093185425, + "train/negative_loss": 0.45816758275032043, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 0.5047887563705444, + "train/total_loss": 0.40645915269851685 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.20289146900177002, - "train/contrastive_loss": 1.1795532703399658, - "train/negative_loss": 1.1466301679611206, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.032923147082328796, - "train/total_loss": 0.4388021230697632 + "train/classification_loss": 0.2579900622367859, + "train/contrastive_loss": 4.260730266571045, + "train/negative_loss": 4.012881755828857, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.24784834682941437, + "train/total_loss": 1.1101361513137817 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.2164650559425354, - "train/contrastive_loss": 1.3453115224838257, - "train/negative_loss": 1.3351221084594727, - "train/num_negatives": 46, + "train/classification_loss": 0.2206651121377945, + "train/contrastive_loss": 1.5702457427978516, + "train/negative_loss": 0.9921298623085022, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.5781158804893494, + "train/total_loss": 0.5347142815589905 + }, + { + "epoch": 5.633802816901408, + "step": 1600, + "train/classification_loss": 0.2739638388156891, + "train/contrastive_loss": 3.6081268787384033, + "train/negative_loss": 2.3873746395111084, + "train/num_negatives": 42, "train/num_positives": 8, - "train/positive_loss": 0.010189397260546684, - "train/total_loss": 0.485527366399765 + "train/positive_loss": 1.220752239227295, + "train/total_loss": 0.9955892562866211 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.19110889732837677, - "train/contrastive_loss": 2.095885753631592, - "train/negative_loss": 2.093590259552002, + "train/classification_loss": 0.1533750593662262, + "train/contrastive_loss": 1.613090991973877, + "train/negative_loss": 0.8586022257804871, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.0022953846491873264, - "train/total_loss": 0.6102860569953918 + "train/num_positives": 10, + "train/positive_loss": 0.7544887065887451, + "train/total_loss": 0.475993275642395 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.17926393449306488, - "train/contrastive_loss": 0.8854845762252808, - "train/negative_loss": 0.8854174613952637, + "train/classification_loss": 0.20242871344089508, + "train/contrastive_loss": 3.991438150405884, + "train/negative_loss": 2.162257194519043, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 1.8291809558868408, + "train/total_loss": 1.0007163286209106 + }, + { + "epoch": 5.633802816901408, + "step": 1600, + "train/classification_loss": 0.20762135088443756, + "train/contrastive_loss": 1.1606533527374268, + "train/negative_loss": 1.1593447923660278, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.0013085369719192386, + "train/total_loss": 0.4397520422935486 + }, + { + "epoch": 5.633802816901408, + "step": 1600, + "train/classification_loss": 0.2719421088695526, + "train/contrastive_loss": 1.808800220489502, + "train/negative_loss": 1.7140024900436401, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 6.714048504363745e-05, - "train/total_loss": 0.35636085271835327 + "train/positive_loss": 0.09479769319295883, + "train/total_loss": 0.6337021589279175 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.2076270431280136, - "train/contrastive_loss": 2.7487316131591797, - "train/negative_loss": 2.1978065967559814, - "train/num_negatives": 36, + "train/classification_loss": 0.20392394065856934, + "train/contrastive_loss": 0.8441608548164368, + "train/negative_loss": 0.6126073002815247, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.2315535545349121, + "train/total_loss": 0.37275612354278564 + }, + { + "epoch": 5.633802816901408, + "step": 1600, + "train/classification_loss": 0.3177470862865448, + "train/contrastive_loss": 3.02396559715271, + "train/negative_loss": 2.4306905269622803, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.5509251356124878, - "train/total_loss": 0.7573733925819397 + "train/positive_loss": 0.5932750105857849, + "train/total_loss": 0.9225401878356934 + }, + { + "epoch": 5.633802816901408, + "step": 1600, + "train/classification_loss": 0.17588309943675995, + "train/contrastive_loss": 1.8991339206695557, + "train/negative_loss": 0.9913210272789001, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.9078129529953003, + "train/total_loss": 0.5557098984718323 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.2471385896205902, - "train/contrastive_loss": 1.9129303693771362, - "train/negative_loss": 1.0560591220855713, + "train/classification_loss": 0.21649636328220367, + "train/contrastive_loss": 2.3409266471862793, + "train/negative_loss": 2.0015835762023926, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.8568712472915649, - "train/total_loss": 0.6297246813774109 + "train/num_positives": 14, + "train/positive_loss": 0.33934295177459717, + "train/total_loss": 0.6846817135810852 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.18602018058300018, - "train/contrastive_loss": 2.8376505374908447, - "train/negative_loss": 1.4491729736328125, + "train/classification_loss": 0.2586718797683716, + "train/contrastive_loss": 2.231245517730713, + "train/negative_loss": 2.2312281131744385, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.3884775638580322, - "train/total_loss": 0.7535502910614014 + "train/num_positives": 2, + "train/positive_loss": 1.7404707250534557e-05, + "train/total_loss": 0.7049210071563721 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.1640855222940445, - "train/contrastive_loss": 1.1919710636138916, - "train/negative_loss": 0.7654391527175903, + "train/classification_loss": 0.2034951001405716, + "train/contrastive_loss": 2.8478569984436035, + "train/negative_loss": 1.6936752796173096, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.4265318810939789, - "train/total_loss": 0.40247973799705505 + "train/num_positives": 16, + "train/positive_loss": 1.1541815996170044, + "train/total_loss": 0.773066520690918 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.30398231744766235, - "train/contrastive_loss": 1.6804981231689453, - "train/negative_loss": 1.3035701513290405, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.3769279420375824, - "train/total_loss": 0.6400819420814514 + "train/classification_loss": 0.18201115727424622, + "train/contrastive_loss": 1.479737639427185, + "train/negative_loss": 0.9148036241531372, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.5649340152740479, + "train/total_loss": 0.47795867919921875 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.12956857681274414, - "train/contrastive_loss": 0.842488169670105, - "train/negative_loss": 0.8424350023269653, - "train/num_negatives": 48, + "train/classification_loss": 0.22470872104167938, + "train/contrastive_loss": 0.9826817512512207, + "train/negative_loss": 0.7071917057037354, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 5.3170071623753756e-05, - "train/total_loss": 0.2980661988258362 + "train/positive_loss": 0.27549004554748535, + "train/total_loss": 0.4212450683116913 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.16824349761009216, - "train/contrastive_loss": 0.623043954372406, - "train/negative_loss": 0.2321988195180893, + "train/classification_loss": 0.22552569210529327, + "train/contrastive_loss": 1.206992506980896, + "train/negative_loss": 0.7897206544876099, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.3908451199531555, - "train/total_loss": 0.2928522825241089 + "train/num_positives": 14, + "train/positive_loss": 0.4172718822956085, + "train/total_loss": 0.46692419052124023 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.13863293826580048, - "train/contrastive_loss": 1.0796566009521484, - "train/negative_loss": 0.9336093068122864, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.14604729413986206, - "train/total_loss": 0.35456424951553345 + "train/classification_loss": 0.3138810694217682, + "train/contrastive_loss": 2.2114133834838867, + "train/negative_loss": 1.7286598682403564, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 0.4827536344528198, + "train/total_loss": 0.7561637163162231 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.21767717599868774, - "train/contrastive_loss": 0.9840031266212463, - "train/negative_loss": 0.8224031329154968, - "train/num_negatives": 28, + "train/classification_loss": 0.1525324434041977, + "train/contrastive_loss": 0.8160380125045776, + "train/negative_loss": 0.6123915910720825, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.16159997880458832, - "train/total_loss": 0.4144778251647949 + "train/positive_loss": 0.20364642143249512, + "train/total_loss": 0.31574004888534546 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.18850520253181458, - "train/contrastive_loss": 2.1888010501861572, - "train/negative_loss": 1.154191255569458, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.0346097946166992, - "train/total_loss": 0.6262654066085815 + "train/classification_loss": 0.15518178045749664, + "train/contrastive_loss": 0.9236260652542114, + "train/negative_loss": 0.33020737767219543, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.5934186577796936, + "train/total_loss": 0.3399069905281067 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.1713729202747345, - "train/contrastive_loss": 0.7926191687583923, - "train/negative_loss": 0.7886372208595276, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.003981932997703552, - "train/total_loss": 0.3298967480659485 + "train/classification_loss": 0.18703415989875793, + "train/contrastive_loss": 0.9746322631835938, + "train/negative_loss": 0.7493367195129395, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.22529557347297668, + "train/total_loss": 0.3819606304168701 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.21429887413978577, - "train/contrastive_loss": 3.2141265869140625, - "train/negative_loss": 1.4134249687194824, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.8007017374038696, - "train/total_loss": 0.8571242094039917 + "train/classification_loss": 0.20868200063705444, + "train/contrastive_loss": 2.178956985473633, + "train/negative_loss": 1.1348897218704224, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.044067144393921, + "train/total_loss": 0.6444734334945679 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.22752733528614044, - "train/contrastive_loss": 2.872220993041992, - "train/negative_loss": 1.4064831733703613, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.4657378196716309, - "train/total_loss": 0.8019715547561646 + "train/classification_loss": 0.22476527094841003, + "train/contrastive_loss": 1.185799241065979, + "train/negative_loss": 0.9723201394081116, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.21347910165786743, + "train/total_loss": 0.46192511916160583 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.1699645072221756, - "train/contrastive_loss": 0.8488954305648804, - "train/negative_loss": 0.5494264960289001, + "train/classification_loss": 0.1576899141073227, + "train/contrastive_loss": 0.6182948350906372, + "train/negative_loss": 0.3953501880168915, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.29946890473365784, - "train/total_loss": 0.33974361419677734 + "train/num_positives": 16, + "train/positive_loss": 0.22294463217258453, + "train/total_loss": 0.2813488841056824 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.1863260418176651, - "train/contrastive_loss": 3.4795570373535156, - "train/negative_loss": 2.282301664352417, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.1972553730010986, - "train/total_loss": 0.882237434387207 + "train/classification_loss": 0.19558343291282654, + "train/contrastive_loss": 1.8985164165496826, + "train/negative_loss": 0.9347307085990906, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 0.9637857675552368, + "train/total_loss": 0.5752867460250854 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.24149039387702942, - "train/contrastive_loss": 2.6990199089050293, - "train/negative_loss": 1.4091668128967285, + "train/classification_loss": 0.27345722913742065, + "train/contrastive_loss": 2.0676190853118896, + "train/negative_loss": 2.062793254852295, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.2898530960083008, - "train/total_loss": 0.7812943458557129 + "train/num_positives": 2, + "train/positive_loss": 0.004825713578611612, + "train/total_loss": 0.6869810819625854 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.21949917078018188, - "train/contrastive_loss": 2.1407928466796875, - "train/negative_loss": 1.7831676006317139, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.3576253056526184, - "train/total_loss": 0.6476577520370483 + "train/classification_loss": 0.15852481126785278, + "train/contrastive_loss": 2.91733980178833, + "train/negative_loss": 1.1113064289093018, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.8060334920883179, + "train/total_loss": 0.7419927716255188 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.19271382689476013, - "train/contrastive_loss": 3.111300468444824, - "train/negative_loss": 1.8778396844863892, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.2334606647491455, - "train/total_loss": 0.8149739503860474 + "train/classification_loss": 0.21702103316783905, + "train/contrastive_loss": 1.9533376693725586, + "train/negative_loss": 1.8773987293243408, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.07593892514705658, + "train/total_loss": 0.6076885461807251 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.20110633969306946, - "train/contrastive_loss": 2.1647958755493164, - "train/negative_loss": 1.7204211950302124, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.44437476992607117, - "train/total_loss": 0.6340655088424683 + "train/classification_loss": 0.20359709858894348, + "train/contrastive_loss": 2.540095806121826, + "train/negative_loss": 0.6672948598861694, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 1.8728008270263672, + "train/total_loss": 0.7116162776947021 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.22334855794906616, - "train/contrastive_loss": 2.9585750102996826, - "train/negative_loss": 2.1633810997009277, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.7951939702033997, - "train/total_loss": 0.8150635957717896 + "train/classification_loss": 0.20051588118076324, + "train/contrastive_loss": 4.684122085571289, + "train/negative_loss": 4.684116363525391, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 5.686307304131333e-06, + "train/total_loss": 1.1373403072357178 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.24571965634822845, - "train/contrastive_loss": 2.2378103733062744, - "train/negative_loss": 1.7925496101379395, + "train/classification_loss": 0.20230109989643097, + "train/contrastive_loss": 0.7998157739639282, + "train/negative_loss": 0.5881301164627075, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.44526082277297974, - "train/total_loss": 0.6932817101478577 + "train/positive_loss": 0.2116856873035431, + "train/total_loss": 0.3622642755508423 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.19804610311985016, - "train/contrastive_loss": 0.9031757116317749, - "train/negative_loss": 0.8942774534225464, + "train/classification_loss": 0.22185884416103363, + "train/contrastive_loss": 2.8162074089050293, + "train/negative_loss": 1.118725061416626, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.008898268453776836, - "train/total_loss": 0.3786812424659729 + "train/num_positives": 8, + "train/positive_loss": 1.6974823474884033, + "train/total_loss": 0.7851003408432007 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.17461691796779633, - "train/contrastive_loss": 0.9045513272285461, - "train/negative_loss": 0.21023105084896088, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.6943202614784241, - "train/total_loss": 0.35552719235420227 + "train/classification_loss": 0.17553521692752838, + "train/contrastive_loss": 2.298393487930298, + "train/negative_loss": 1.1296616792678833, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.1687318086624146, + "train/total_loss": 0.6352139115333557 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.19503344595432281, - "train/contrastive_loss": 2.064955711364746, - "train/negative_loss": 0.8357704877853394, - "train/num_negatives": 46, + "train/classification_loss": 0.25741371512413025, + "train/contrastive_loss": 1.8554365634918213, + "train/negative_loss": 1.36845064163208, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 1.2291853427886963, - "train/total_loss": 0.6080245971679688 + "train/positive_loss": 0.4869858920574188, + "train/total_loss": 0.6285010576248169 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.25202780961990356, - "train/contrastive_loss": 1.5976955890655518, - "train/negative_loss": 1.5976955890655518, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5715669393539429 - }, - { - "epoch": 6.083650190114068, - "eval_exact_match_accuracy": 0.21333333333333335, - "eval_hamming_loss": 0.07563025210084033, - "eval_loss": 0.596592903137207, - "eval_macro_f1": 0.15091558134717462, - "eval_macro_precision": 0.28379378813943734, - "eval_macro_recall": 0.11888294932162789, - "eval_micro_f1": 0.4407622203811102, - "eval_micro_precision": 0.8109756097560976, - "eval_micro_recall": 0.3026166097838453, - "eval_runtime": 2.6369, - "eval_samples_per_second": 199.096, - "eval_steps_per_second": 25.029, + "train/classification_loss": 0.1986110359430313, + "train/contrastive_loss": 0.9597651958465576, + "train/negative_loss": 0.6958547830581665, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.2639104127883911, + "train/total_loss": 0.39056408405303955 + }, + { + "epoch": 5.633802816901408, + "eval_exact_match_accuracy": 0.2292768959435626, + "eval_hamming_loss": 0.07293287685444548, + "eval_loss": 0.6104494333267212, + "eval_macro_f1": 0.21772971254811033, + "eval_macro_precision": 0.3684285285076008, + "eval_macro_recall": 0.1696943358517272, + "eval_micro_f1": 0.45120999219359875, + "eval_micro_precision": 0.8425655976676385, + "eval_micro_recall": 0.30810234541577824, + "eval_runtime": 2.8442, + "eval_samples_per_second": 199.356, + "eval_steps_per_second": 24.963, "step": 1600 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.14773133397102356, - "train/contrastive_loss": 0.9247452616691589, - "train/negative_loss": 0.4463837444782257, - "train/num_negatives": 22, - "train/num_positives": 32, - "train/positive_loss": 0.4783615171909332, - "train/total_loss": 0.3326804041862488 + "train/classification_loss": 0.19540128111839294, + "train/contrastive_loss": 1.2757567167282104, + "train/negative_loss": 1.1663979291915894, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.1093587651848793, + "train/total_loss": 0.45055264234542847 }, { - "epoch": 6.083650190114068, + "epoch": 5.633802816901408, "step": 1600, - "train/classification_loss": 0.261381596326828, - "train/contrastive_loss": 1.2548542022705078, - "train/negative_loss": 1.1037843227386475, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.15106986463069916, - "train/total_loss": 0.512352466583252 + "train/classification_loss": 0.20016218721866608, + "train/contrastive_loss": 1.5143775939941406, + "train/negative_loss": 1.4740484952926636, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.040329139679670334, + "train/total_loss": 0.503037691116333 }, { - "epoch": 6.273764258555133, - "grad_norm": 7.449739456176758, - "learning_rate": 1.976453576864536e-05, - "loss": 0.8074, + "epoch": 5.809859154929578, + "grad_norm": 12.960160255432129, + "learning_rate": 1.9782100070472167e-05, + "loss": 0.9118, "step": 1650 }, { - "epoch": 6.273764258555133, + "epoch": 5.809859154929578, "step": 1650, - "train/classification_loss": 0.16764649748802185, - "train/contrastive_loss": 0.8647753000259399, - "train/negative_loss": 0.34381040930747986, - "train/num_negatives": 30, - "train/num_positives": 24, - "train/positive_loss": 0.5209648609161377, - "train/total_loss": 0.3406015634536743 + "train/classification_loss": 0.19248813390731812, + "train/contrastive_loss": 0.9245613217353821, + "train/negative_loss": 0.8709220886230469, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.05363922193646431, + "train/total_loss": 0.37740039825439453 }, { - "epoch": 6.273764258555133, + "epoch": 5.809859154929578, "step": 1650, - "train/classification_loss": 0.19089314341545105, - "train/contrastive_loss": 0.7993524074554443, - "train/negative_loss": 0.48006609082221985, + "train/classification_loss": 0.20316040515899658, + "train/contrastive_loss": 1.0644290447235107, + "train/negative_loss": 0.5469610095024109, "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.3192863464355469, - "train/total_loss": 0.35076361894607544 + "train/num_positives": 12, + "train/positive_loss": 0.5174680352210999, + "train/total_loss": 0.4160462021827698 }, { - "epoch": 6.4638783269961975, - "grad_norm": 11.640963554382324, - "learning_rate": 1.9756925418569255e-05, - "loss": 0.8247, + "epoch": 5.985915492957746, + "grad_norm": 12.231520652770996, + "learning_rate": 1.977505285412262e-05, + "loss": 0.8783, "step": 1700 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.28365591168403625, - "train/contrastive_loss": 2.2342581748962402, - "train/negative_loss": 1.4337579011917114, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.8005002737045288, - "train/total_loss": 0.7305075526237488 + "train/classification_loss": 0.221462219953537, + "train/contrastive_loss": 2.4590988159179688, + "train/negative_loss": 1.7600843906402588, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.6990143656730652, + "train/total_loss": 0.7132819890975952 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.23356275260448456, - "train/contrastive_loss": 2.84515380859375, - "train/negative_loss": 1.434964895248413, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 1.4101887941360474, - "train/total_loss": 0.8025935292243958 + "train/classification_loss": 0.26578959822654724, + "train/contrastive_loss": 1.0746912956237793, + "train/negative_loss": 0.6682382225990295, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.40645313262939453, + "train/total_loss": 0.4807278513908386 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.1761004477739334, - "train/contrastive_loss": 2.148435354232788, - "train/negative_loss": 0.6296899318695068, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.5187454223632812, - "train/total_loss": 0.6057875156402588 + "train/classification_loss": 0.26474907994270325, + "train/contrastive_loss": 3.065286636352539, + "train/negative_loss": 1.94959557056427, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.115691065788269, + "train/total_loss": 0.8778064250946045 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.20248109102249146, - "train/contrastive_loss": 2.098848819732666, - "train/negative_loss": 1.0437722206115723, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.0550765991210938, - "train/total_loss": 0.6222508549690247 + "train/classification_loss": 0.14364959299564362, + "train/contrastive_loss": 0.9807185530662537, + "train/negative_loss": 0.8213047981262207, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.15941375494003296, + "train/total_loss": 0.33979332447052 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.16151446104049683, - "train/contrastive_loss": 1.2047245502471924, - "train/negative_loss": 0.5100447535514832, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.694679856300354, - "train/total_loss": 0.40245938301086426 + "train/classification_loss": 0.2084214836359024, + "train/contrastive_loss": 2.3200767040252686, + "train/negative_loss": 2.0234482288360596, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.296628475189209, + "train/total_loss": 0.6724368333816528 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.19062811136245728, - "train/contrastive_loss": 3.1450133323669434, - "train/negative_loss": 1.4669756889343262, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 1.6780376434326172, - "train/total_loss": 0.8196308016777039 + "train/classification_loss": 0.2177915722131729, + "train/contrastive_loss": 2.948605537414551, + "train/negative_loss": 1.6253365278244019, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 1.3232691287994385, + "train/total_loss": 0.8075127005577087 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.2632043957710266, - "train/contrastive_loss": 2.173308849334717, - "train/negative_loss": 1.9205602407455444, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.25274863839149475, - "train/total_loss": 0.6978662014007568 + "train/classification_loss": 0.21262404322624207, + "train/contrastive_loss": 2.0823614597320557, + "train/negative_loss": 1.1420468091964722, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.9403145909309387, + "train/total_loss": 0.6290963292121887 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.1778876632452011, - "train/contrastive_loss": 1.209371566772461, - "train/negative_loss": 1.1070261001586914, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.10234545171260834, - "train/total_loss": 0.41976198554039 + "train/classification_loss": 0.21171583235263824, + "train/contrastive_loss": 1.133407711982727, + "train/negative_loss": 1.132680892944336, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 0.0007267850451171398, + "train/total_loss": 0.4383973777294159 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.15556134283542633, - "train/contrastive_loss": 1.3343573808670044, - "train/negative_loss": 1.1299916505813599, + "train/classification_loss": 0.13563896715641022, + "train/contrastive_loss": 0.6403701305389404, + "train/negative_loss": 0.40667724609375, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.20436576008796692, - "train/total_loss": 0.4224328398704529 + "train/positive_loss": 0.23369285464286804, + "train/total_loss": 0.263713002204895 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.27527645230293274, - "train/contrastive_loss": 2.9943971633911133, - "train/negative_loss": 1.9051058292388916, + "train/classification_loss": 0.2288937270641327, + "train/contrastive_loss": 2.151214599609375, + "train/negative_loss": 0.9454410076141357, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.0892912149429321, - "train/total_loss": 0.8741558790206909 + "train/num_positives": 14, + "train/positive_loss": 1.2057735919952393, + "train/total_loss": 0.6591366529464722 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.20630522072315216, - "train/contrastive_loss": 2.1884660720825195, - "train/negative_loss": 1.6160128116607666, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.5724532604217529, - "train/total_loss": 0.6439984440803528 + "train/classification_loss": 0.17437100410461426, + "train/contrastive_loss": 1.8770527839660645, + "train/negative_loss": 0.830203115940094, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 1.0468497276306152, + "train/total_loss": 0.5497815608978271 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.1423015296459198, - "train/contrastive_loss": 2.1561601161956787, - "train/negative_loss": 0.6485298871994019, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 1.5076302289962769, - "train/total_loss": 0.5735335350036621 + "train/classification_loss": 0.19360946118831635, + "train/contrastive_loss": 1.2126843929290771, + "train/negative_loss": 1.2080878019332886, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.00459654163569212, + "train/total_loss": 0.4361463487148285 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.23402121663093567, - "train/contrastive_loss": 2.8091282844543457, - "train/negative_loss": 1.6284306049346924, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.1806977987289429, - "train/total_loss": 0.7958469390869141 + "train/classification_loss": 0.21134503185749054, + "train/contrastive_loss": 3.1952462196350098, + "train/negative_loss": 1.8184351921081543, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.376810908317566, + "train/total_loss": 0.8503942489624023 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.14980025589466095, - "train/contrastive_loss": 2.145012617111206, - "train/negative_loss": 2.1229701042175293, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.022042514756321907, - "train/total_loss": 0.578802764415741 + "train/classification_loss": 0.20954521000385284, + "train/contrastive_loss": 2.272305727005005, + "train/negative_loss": 1.4754786491394043, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.7968271374702454, + "train/total_loss": 0.6640063524246216 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.1469021886587143, - "train/contrastive_loss": 1.6674000024795532, - "train/negative_loss": 1.4252352714538574, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.24216468632221222, - "train/total_loss": 0.48038220405578613 + "train/classification_loss": 0.1568308174610138, + "train/contrastive_loss": 3.2329628467559814, + "train/negative_loss": 0.8909221291542053, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 2.342040777206421, + "train/total_loss": 0.8034234046936035 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.15596812963485718, - "train/contrastive_loss": 1.2459988594055176, - "train/negative_loss": 0.7011423707008362, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.5448564887046814, - "train/total_loss": 0.40516790747642517 + "train/classification_loss": 0.18643267452716827, + "train/contrastive_loss": 1.139142632484436, + "train/negative_loss": 0.6296855211257935, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.5094571113586426, + "train/total_loss": 0.41426122188568115 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.2405891716480255, - "train/contrastive_loss": 2.767855405807495, - "train/negative_loss": 1.6635417938232422, - "train/num_negatives": 40, + "train/classification_loss": 0.15659183263778687, + "train/contrastive_loss": 1.1242566108703613, + "train/negative_loss": 0.5465371608734131, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 1.104313611984253, - "train/total_loss": 0.7941602468490601 + "train/positive_loss": 0.577719509601593, + "train/total_loss": 0.3814431428909302 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.1918724924325943, - "train/contrastive_loss": 1.2165744304656982, - "train/negative_loss": 0.27739566564559937, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.9391787648200989, - "train/total_loss": 0.4351873993873596 + "train/classification_loss": 0.21117204427719116, + "train/contrastive_loss": 1.4498136043548584, + "train/negative_loss": 0.9634303450584412, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.4863832890987396, + "train/total_loss": 0.5011347532272339 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.2082262635231018, - "train/contrastive_loss": 1.5611348152160645, - "train/negative_loss": 1.2152106761932373, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.3459240794181824, - "train/total_loss": 0.5204532146453857 + "train/classification_loss": 0.1872931718826294, + "train/contrastive_loss": 0.803306519985199, + "train/negative_loss": 0.5756934881210327, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.22761301696300507, + "train/total_loss": 0.34795448184013367 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.16658636927604675, - "train/contrastive_loss": 1.9956740140914917, - "train/negative_loss": 1.1820802688598633, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.8135937452316284, - "train/total_loss": 0.5657211542129517 + "train/classification_loss": 0.19166812300682068, + "train/contrastive_loss": 3.7552285194396973, + "train/negative_loss": 1.8110504150390625, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.9441779851913452, + "train/total_loss": 0.9427138566970825 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.2531900107860565, - "train/contrastive_loss": 1.3479218482971191, - "train/negative_loss": 0.5609212517738342, - "train/num_negatives": 44, + "train/classification_loss": 0.1606128066778183, + "train/contrastive_loss": 1.4483282566070557, + "train/negative_loss": 1.387937307357788, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.7870006561279297, - "train/total_loss": 0.5227743983268738 + "train/positive_loss": 0.06039094552397728, + "train/total_loss": 0.45027846097946167 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.26505792140960693, - "train/contrastive_loss": 1.8952958583831787, - "train/negative_loss": 1.6524852514266968, - "train/num_negatives": 44, + "train/classification_loss": 0.13656173646450043, + "train/contrastive_loss": 2.849153518676758, + "train/negative_loss": 2.0549163818359375, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.24281062185764313, - "train/total_loss": 0.6441171169281006 + "train/positive_loss": 0.7942370176315308, + "train/total_loss": 0.7063924670219421 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.14757242798805237, - "train/contrastive_loss": 1.2798657417297363, - "train/negative_loss": 0.6447213292121887, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.6351444721221924, - "train/total_loss": 0.4035455882549286 + "train/classification_loss": 0.1886182427406311, + "train/contrastive_loss": 3.554659366607666, + "train/negative_loss": 1.2033625841140747, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 2.3512966632843018, + "train/total_loss": 0.8995501399040222 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.1441599279642105, - "train/contrastive_loss": 0.669651210308075, - "train/negative_loss": 0.35449644923210144, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.3151547610759735, - "train/total_loss": 0.2780901789665222 + "train/classification_loss": 0.2407016158103943, + "train/contrastive_loss": 2.665372133255005, + "train/negative_loss": 1.462630033493042, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.202742099761963, + "train/total_loss": 0.7737760543823242 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.12547339498996735, - "train/contrastive_loss": 2.078812599182129, - "train/negative_loss": 1.255866289138794, + "train/classification_loss": 0.1961059272289276, + "train/contrastive_loss": 2.311809539794922, + "train/negative_loss": 1.3634473085403442, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.8229463696479797, - "train/total_loss": 0.5412359237670898 + "train/num_positives": 10, + "train/positive_loss": 0.9483621716499329, + "train/total_loss": 0.6584678292274475 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.274122029542923, - "train/contrastive_loss": 1.9316766262054443, - "train/negative_loss": 0.6734241843223572, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.2582523822784424, - "train/total_loss": 0.6604573726654053 + "train/classification_loss": 0.20183724164962769, + "train/contrastive_loss": 2.424044609069824, + "train/negative_loss": 1.7180655002593994, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.70597904920578, + "train/total_loss": 0.6866461634635925 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.25020018219947815, - "train/contrastive_loss": 3.0414397716522217, - "train/negative_loss": 1.4562053680419922, + "train/classification_loss": 0.21263127028942108, + "train/contrastive_loss": 2.2292354106903076, + "train/negative_loss": 2.2167515754699707, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.5852344036102295, - "train/total_loss": 0.8584882020950317 + "train/num_positives": 4, + "train/positive_loss": 0.012483775615692139, + "train/total_loss": 0.6584783792495728 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.19550909101963043, - "train/contrastive_loss": 2.7293052673339844, - "train/negative_loss": 2.1714980602264404, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.5578071475028992, - "train/total_loss": 0.7413701415061951 + "train/classification_loss": 0.19967931509017944, + "train/contrastive_loss": 0.4156442880630493, + "train/negative_loss": 0.4051029086112976, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.010541382245719433, + "train/total_loss": 0.28280818462371826 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.2077874094247818, - "train/contrastive_loss": 1.601229190826416, - "train/negative_loss": 0.6362680792808533, - "train/num_negatives": 40, + "train/classification_loss": 0.24373365938663483, + "train/contrastive_loss": 3.2246389389038086, + "train/negative_loss": 1.6302928924560547, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.9649611711502075, - "train/total_loss": 0.5280332565307617 - }, - { - "epoch": 6.4638783269961975, - "step": 1700, - "train/classification_loss": 0.22112783789634705, - "train/contrastive_loss": 1.8836536407470703, - "train/negative_loss": 1.488613486289978, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.3950401544570923, - "train/total_loss": 0.5978585481643677 + "train/positive_loss": 1.594346046447754, + "train/total_loss": 0.8886614441871643 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.16052529215812683, - "train/contrastive_loss": 0.8945627212524414, - "train/negative_loss": 0.4876456558704376, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.4069170355796814, - "train/total_loss": 0.3394378423690796 - }, - { - "epoch": 6.4638783269961975, - "step": 1700, - "train/classification_loss": 0.24042533338069916, - "train/contrastive_loss": 3.253828287124634, - "train/negative_loss": 2.1318142414093018, + "train/classification_loss": 0.22044453024864197, + "train/contrastive_loss": 1.211272120475769, + "train/negative_loss": 1.0419281721115112, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.122014045715332, - "train/total_loss": 0.8911910057067871 + "train/num_positives": 10, + "train/positive_loss": 0.1693439483642578, + "train/total_loss": 0.46269893646240234 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.24331878125667572, - "train/contrastive_loss": 0.8676303625106812, - "train/negative_loss": 0.8660835027694702, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.001546863466501236, - "train/total_loss": 0.41684484481811523 + "train/classification_loss": 0.1694960594177246, + "train/contrastive_loss": 0.7772913575172424, + "train/negative_loss": 0.6609813570976257, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.1163100153207779, + "train/total_loss": 0.3249543309211731 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.21012167632579803, - "train/contrastive_loss": 1.887359857559204, - "train/negative_loss": 0.9531071186065674, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.9342526793479919, - "train/total_loss": 0.587593674659729 + "train/classification_loss": 0.19062626361846924, + "train/contrastive_loss": 3.0883870124816895, + "train/negative_loss": 1.5537185668945312, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.5346685647964478, + "train/total_loss": 0.8083036541938782 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.1954040378332138, - "train/contrastive_loss": 2.9483864307403564, - "train/negative_loss": 1.7322033643722534, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.216183066368103, - "train/total_loss": 0.7850813269615173 + "train/classification_loss": 0.20361821353435516, + "train/contrastive_loss": 1.8659075498580933, + "train/negative_loss": 1.1411710977554321, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.7247364521026611, + "train/total_loss": 0.576799750328064 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.18148472905158997, - "train/contrastive_loss": 3.985342502593994, - "train/negative_loss": 1.537305474281311, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 2.4480371475219727, - "train/total_loss": 0.978553295135498 + "train/classification_loss": 0.21600548923015594, + "train/contrastive_loss": 1.862668752670288, + "train/negative_loss": 1.6935091018676758, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.16915962100028992, + "train/total_loss": 0.5885392427444458 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.17871740460395813, - "train/contrastive_loss": 1.8626443147659302, - "train/negative_loss": 0.7882256507873535, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 1.0744186639785767, - "train/total_loss": 0.5512462854385376 + "train/classification_loss": 0.24313080310821533, + "train/contrastive_loss": 2.2547178268432617, + "train/negative_loss": 1.174124002456665, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 1.0805939435958862, + "train/total_loss": 0.6940743923187256 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.1915382444858551, - "train/contrastive_loss": 1.3810514211654663, - "train/negative_loss": 1.2202191352844238, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.1608322560787201, - "train/total_loss": 0.4677485227584839 + "train/classification_loss": 0.14961303770542145, + "train/contrastive_loss": 2.239539861679077, + "train/negative_loss": 2.2394859790802, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 5.387864075601101e-05, + "train/total_loss": 0.5975210070610046 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.22627508640289307, - "train/contrastive_loss": 1.751883864402771, - "train/negative_loss": 1.3378651142120361, + "train/classification_loss": 0.19872525334358215, + "train/contrastive_loss": 0.8004911541938782, + "train/negative_loss": 0.7016170620918274, "train/num_negatives": 46, "train/num_positives": 8, - "train/positive_loss": 0.41401875019073486, - "train/total_loss": 0.5766518712043762 + "train/positive_loss": 0.09887408465147018, + "train/total_loss": 0.3588234782218933 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.20269836485385895, - "train/contrastive_loss": 2.2348756790161133, - "train/negative_loss": 2.217637062072754, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.01723853126168251, - "train/total_loss": 0.6496735215187073 + "train/classification_loss": 0.2644781768321991, + "train/contrastive_loss": 2.931800365447998, + "train/negative_loss": 2.60398268699646, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.3278176784515381, + "train/total_loss": 0.850838303565979 + }, + { + "epoch": 5.985915492957746, + "step": 1700, + "train/classification_loss": 0.20335166156291962, + "train/contrastive_loss": 0.6078771352767944, + "train/negative_loss": 0.4523654878139496, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.15551163256168365, + "train/total_loss": 0.32492709159851074 + }, + { + "epoch": 5.985915492957746, + "step": 1700, + "train/classification_loss": 0.2844522297382355, + "train/contrastive_loss": 4.9069600105285645, + "train/negative_loss": 2.1426827907562256, + "train/num_negatives": 42, + "train/num_positives": 8, + "train/positive_loss": 2.764277219772339, + "train/total_loss": 1.2658442258834839 + }, + { + "epoch": 5.985915492957746, + "step": 1700, + "train/classification_loss": 0.1465490609407425, + "train/contrastive_loss": 0.670142412185669, + "train/negative_loss": 0.4068988859653473, + "train/num_negatives": 46, + "train/num_positives": 10, + "train/positive_loss": 0.26324349641799927, + "train/total_loss": 0.28057754039764404 + }, + { + "epoch": 5.985915492957746, + "step": 1700, + "train/classification_loss": 0.1882716566324234, + "train/contrastive_loss": 2.1887221336364746, + "train/negative_loss": 0.973315417766571, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 1.2154067754745483, + "train/total_loss": 0.6260160803794861 + }, + { + "epoch": 5.985915492957746, + "step": 1700, + "train/classification_loss": 0.2017248421907425, + "train/contrastive_loss": 1.0781397819519043, + "train/negative_loss": 1.0779799222946167, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.00015984913625288755, + "train/total_loss": 0.4173527956008911 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.182021826505661, - "train/contrastive_loss": 1.1526817083358765, - "train/negative_loss": 1.1512413024902344, + "train/classification_loss": 0.264041006565094, + "train/contrastive_loss": 1.027521014213562, + "train/negative_loss": 0.9978155493736267, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.0014403578825294971, - "train/total_loss": 0.4125581681728363 + "train/positive_loss": 0.029705418273806572, + "train/total_loss": 0.4695452153682709 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.20768427848815918, - "train/contrastive_loss": 2.7083470821380615, - "train/negative_loss": 2.2220990657806396, - "train/num_negatives": 36, + "train/classification_loss": 0.19865308701992035, + "train/contrastive_loss": 1.1342270374298096, + "train/negative_loss": 0.6809921264648438, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.4532349109649658, + "train/total_loss": 0.42549848556518555 + }, + { + "epoch": 5.985915492957746, + "step": 1700, + "train/classification_loss": 0.3010791838169098, + "train/contrastive_loss": 2.9710891246795654, + "train/negative_loss": 2.2176454067230225, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.4862479269504547, - "train/total_loss": 0.7493537068367004 + "train/positive_loss": 0.753443717956543, + "train/total_loss": 0.8952970504760742 + }, + { + "epoch": 5.985915492957746, + "step": 1700, + "train/classification_loss": 0.17824791371822357, + "train/contrastive_loss": 1.940492868423462, + "train/negative_loss": 1.0547819137573242, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.8857110142707825, + "train/total_loss": 0.5663464665412903 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.23052796721458435, - "train/contrastive_loss": 0.7456792593002319, - "train/negative_loss": 0.6617339253425598, + "train/classification_loss": 0.21051530539989471, + "train/contrastive_loss": 2.504512071609497, + "train/negative_loss": 2.1072912216186523, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.08394533395767212, - "train/total_loss": 0.3796638250350952 + "train/num_positives": 14, + "train/positive_loss": 0.39722082018852234, + "train/total_loss": 0.7114177346229553 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.17583850026130676, - "train/contrastive_loss": 2.2746901512145996, - "train/negative_loss": 1.6035470962524414, + "train/classification_loss": 0.2624529302120209, + "train/contrastive_loss": 2.2317891120910645, + "train/negative_loss": 2.2316646575927734, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.6711429357528687, - "train/total_loss": 0.6307765245437622 + "train/num_positives": 2, + "train/positive_loss": 0.00012446223990991712, + "train/total_loss": 0.7088107466697693 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.1557941436767578, - "train/contrastive_loss": 1.7099452018737793, - "train/negative_loss": 0.8394284248352051, + "train/classification_loss": 0.19717855751514435, + "train/contrastive_loss": 1.9128272533416748, + "train/negative_loss": 1.188171625137329, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.870516836643219, - "train/total_loss": 0.49778318405151367 + "train/num_positives": 16, + "train/positive_loss": 0.7246555685997009, + "train/total_loss": 0.5797440409660339 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.27869391441345215, - "train/contrastive_loss": 1.373921275138855, - "train/negative_loss": 1.2763222455978394, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.0975990816950798, - "train/total_loss": 0.5534781813621521 + "train/classification_loss": 0.1748032420873642, + "train/contrastive_loss": 0.8358477354049683, + "train/negative_loss": 0.5673885941505432, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.26845914125442505, + "train/total_loss": 0.34197279810905457 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.13523392379283905, - "train/contrastive_loss": 1.0375080108642578, - "train/negative_loss": 1.0300893783569336, - "train/num_negatives": 48, + "train/classification_loss": 0.22560089826583862, + "train/contrastive_loss": 0.820905864238739, + "train/negative_loss": 0.6663085222244263, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 0.007418673951178789, - "train/total_loss": 0.34273552894592285 + "train/positive_loss": 0.15459734201431274, + "train/total_loss": 0.3897820711135864 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.17994455993175507, - "train/contrastive_loss": 0.7380223274230957, - "train/negative_loss": 0.4432928264141083, + "train/classification_loss": 0.21513667702674866, + "train/contrastive_loss": 0.9757977724075317, + "train/negative_loss": 0.7348029613494873, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.2947295010089874, - "train/total_loss": 0.3275490403175354 + "train/num_positives": 14, + "train/positive_loss": 0.24099482595920563, + "train/total_loss": 0.410296231508255 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.1203366294503212, - "train/contrastive_loss": 0.5977274775505066, - "train/negative_loss": 0.5719807147979736, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.025746772065758705, - "train/total_loss": 0.23988212645053864 + "train/classification_loss": 0.30533134937286377, + "train/contrastive_loss": 2.474186897277832, + "train/negative_loss": 1.445794701576233, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 1.0283920764923096, + "train/total_loss": 0.8001687526702881 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.21411095559597015, - "train/contrastive_loss": 0.5207065343856812, - "train/negative_loss": 0.367805540561676, - "train/num_negatives": 28, + "train/classification_loss": 0.1487395316362381, + "train/contrastive_loss": 0.9981712102890015, + "train/negative_loss": 0.6140452027320862, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.15290097892284393, - "train/total_loss": 0.3182522654533386 + "train/positive_loss": 0.38412603735923767, + "train/total_loss": 0.34837377071380615 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.18263360857963562, - "train/contrastive_loss": 2.0614097118377686, - "train/negative_loss": 1.1726405620574951, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.8887691497802734, - "train/total_loss": 0.5949155688285828 + "train/classification_loss": 0.1429874449968338, + "train/contrastive_loss": 0.6080282330513, + "train/negative_loss": 0.30353280901908875, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.3044954240322113, + "train/total_loss": 0.26459309458732605 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.17754122614860535, - "train/contrastive_loss": 0.9623854160308838, - "train/negative_loss": 0.7379752397537231, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.22441016137599945, - "train/total_loss": 0.3700183033943176 + "train/classification_loss": 0.17727260291576385, + "train/contrastive_loss": 1.2232487201690674, + "train/negative_loss": 1.0168335437774658, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.20641522109508514, + "train/total_loss": 0.42192235589027405 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.19384483993053436, - "train/contrastive_loss": 2.8172123432159424, - "train/negative_loss": 0.9701177477836609, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.8470945358276367, - "train/total_loss": 0.757287323474884 + "train/classification_loss": 0.21506135165691376, + "train/contrastive_loss": 2.62617564201355, + "train/negative_loss": 1.3170585632324219, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.309117078781128, + "train/total_loss": 0.740296483039856 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.2240847945213318, - "train/contrastive_loss": 2.2460079193115234, - "train/negative_loss": 1.1741838455200195, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.0718241930007935, - "train/total_loss": 0.6732863783836365 + "train/classification_loss": 0.22454994916915894, + "train/contrastive_loss": 1.4407482147216797, + "train/negative_loss": 1.1716587543487549, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.2690894603729248, + "train/total_loss": 0.5126996040344238 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.19358791410923004, - "train/contrastive_loss": 1.0847373008728027, - "train/negative_loss": 0.5215328335762024, + "train/classification_loss": 0.1419769525527954, + "train/contrastive_loss": 0.2084272801876068, + "train/negative_loss": 0.143569216132164, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.5632044672966003, - "train/total_loss": 0.41053539514541626 + "train/num_positives": 16, + "train/positive_loss": 0.06485805660486221, + "train/total_loss": 0.18366241455078125 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.1738317459821701, - "train/contrastive_loss": 2.753288984298706, - "train/negative_loss": 1.558111548423767, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.195177435874939, - "train/total_loss": 0.7244895696640015 + "train/classification_loss": 0.20207370817661285, + "train/contrastive_loss": 3.027205467224121, + "train/negative_loss": 1.172908902168274, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 1.8542965650558472, + "train/total_loss": 0.8075147867202759 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.24972940981388092, - "train/contrastive_loss": 2.3591713905334473, - "train/negative_loss": 1.3022618293762207, + "train/classification_loss": 0.2549789845943451, + "train/contrastive_loss": 1.9599878787994385, + "train/negative_loss": 1.1245739459991455, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.0569095611572266, - "train/total_loss": 0.7215636968612671 + "train/num_positives": 2, + "train/positive_loss": 0.8354139924049377, + "train/total_loss": 0.6469765901565552 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.21654553711414337, - "train/contrastive_loss": 2.1127634048461914, - "train/negative_loss": 1.6598448753356934, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.4529185891151428, - "train/total_loss": 0.6390982270240784 + "train/classification_loss": 0.15109749138355255, + "train/contrastive_loss": 2.3361682891845703, + "train/negative_loss": 1.2406820058822632, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.0954861640930176, + "train/total_loss": 0.6183311343193054 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.20146487653255463, - "train/contrastive_loss": 2.783494710922241, - "train/negative_loss": 1.443155288696289, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.3403394222259521, - "train/total_loss": 0.7581638693809509 + "train/classification_loss": 0.21592342853546143, + "train/contrastive_loss": 0.8044255375862122, + "train/negative_loss": 0.6018489003181458, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.2025766223669052, + "train/total_loss": 0.3768085241317749 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.19968368113040924, - "train/contrastive_loss": 1.8613789081573486, - "train/negative_loss": 1.326163649559021, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.5352153182029724, - "train/total_loss": 0.5719594955444336 + "train/classification_loss": 0.20050044357776642, + "train/contrastive_loss": 1.799804925918579, + "train/negative_loss": 0.44646501541137695, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 1.3533399105072021, + "train/total_loss": 0.5604614615440369 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.2273884117603302, - "train/contrastive_loss": 2.930764675140381, - "train/negative_loss": 2.2236998081207275, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.7070649266242981, - "train/total_loss": 0.8135414123535156 + "train/classification_loss": 0.19952112436294556, + "train/contrastive_loss": 3.3044862747192383, + "train/negative_loss": 3.3044817447662354, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 4.446522780199302e-06, + "train/total_loss": 0.8604183793067932 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.23322834074497223, - "train/contrastive_loss": 1.8649592399597168, - "train/negative_loss": 1.2806864976882935, + "train/classification_loss": 0.19301091134548187, + "train/contrastive_loss": 0.9563617706298828, + "train/negative_loss": 0.7286988496780396, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.5842728018760681, - "train/total_loss": 0.6062201857566833 + "train/positive_loss": 0.22766292095184326, + "train/total_loss": 0.38428327441215515 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.19247926771640778, - "train/contrastive_loss": 0.7928391098976135, - "train/negative_loss": 0.783078134059906, + "train/classification_loss": 0.22885334491729736, + "train/contrastive_loss": 2.997878074645996, + "train/negative_loss": 1.434131383895874, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.009760959073901176, - "train/total_loss": 0.3510470986366272 + "train/num_positives": 8, + "train/positive_loss": 1.5637468099594116, + "train/total_loss": 0.8284289836883545 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.1700798124074936, - "train/contrastive_loss": 1.0238678455352783, - "train/negative_loss": 0.3456326127052307, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.6782351732254028, - "train/total_loss": 0.37485337257385254 + "train/classification_loss": 0.17190083861351013, + "train/contrastive_loss": 3.1119890213012695, + "train/negative_loss": 1.4986212253570557, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.6133679151535034, + "train/total_loss": 0.7942986488342285 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.17835398018360138, - "train/contrastive_loss": 1.531583309173584, - "train/negative_loss": 0.4798278510570526, - "train/num_negatives": 46, + "train/classification_loss": 0.2603514492511749, + "train/contrastive_loss": 2.2727572917938232, + "train/negative_loss": 1.4112029075622559, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 1.051755428314209, - "train/total_loss": 0.48467063903808594 + "train/positive_loss": 0.8615543842315674, + "train/total_loss": 0.7149028778076172 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.24467763304710388, - "train/contrastive_loss": 1.68598473072052, - "train/negative_loss": 1.68598473072052, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5818746089935303 - }, - { - "epoch": 6.4638783269961975, - "eval_exact_match_accuracy": 0.22095238095238096, - "eval_hamming_loss": 0.07361344537815126, - "eval_loss": 0.5771893262863159, - "eval_macro_f1": 0.17018142934860675, - "eval_macro_precision": 0.3269980080302193, - "eval_macro_recall": 0.12911413433970406, - "eval_micro_f1": 0.45112781954887216, - "eval_micro_precision": 0.8490566037735849, - "eval_micro_recall": 0.30716723549488056, - "eval_runtime": 2.6211, - "eval_samples_per_second": 200.296, - "eval_steps_per_second": 25.18, + "train/classification_loss": 0.19999635219573975, + "train/contrastive_loss": 1.228564739227295, + "train/negative_loss": 0.6873701214790344, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.5411945581436157, + "train/total_loss": 0.4457092881202698 + }, + { + "epoch": 5.985915492957746, + "eval_exact_match_accuracy": 0.2328042328042328, + "eval_hamming_loss": 0.0718954248366013, + "eval_loss": 0.5884774327278137, + "eval_macro_f1": 0.2116625113728062, + "eval_macro_precision": 0.3748543607342939, + "eval_macro_recall": 0.16463818743176792, + "eval_micro_f1": 0.4556166535742341, + "eval_micro_precision": 0.8656716417910447, + "eval_micro_recall": 0.3091684434968017, + "eval_runtime": 2.8433, + "eval_samples_per_second": 199.417, + "eval_steps_per_second": 24.971, "step": 1700 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.15760912001132965, - "train/contrastive_loss": 1.2662718296051025, - "train/negative_loss": 0.6921809315681458, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.574090838432312, - "train/total_loss": 0.4108635187149048 + "train/classification_loss": 0.18421414494514465, + "train/contrastive_loss": 1.2526923418045044, + "train/negative_loss": 1.1650878190994263, + "train/num_negatives": 54, + "train/num_positives": 2, + "train/positive_loss": 0.08760447800159454, + "train/total_loss": 0.43475261330604553 }, { - "epoch": 6.4638783269961975, + "epoch": 5.985915492957746, "step": 1700, - "train/classification_loss": 0.18905743956565857, - "train/contrastive_loss": 1.7470701932907104, - "train/negative_loss": 1.0131630897521973, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.7339071035385132, - "train/total_loss": 0.5384714603424072 + "train/classification_loss": 0.23508144915103912, + "train/contrastive_loss": 2.827434539794922, + "train/negative_loss": 1.0404642820358276, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 1.7869703769683838, + "train/total_loss": 0.8005683422088623 }, { - "epoch": 6.653992395437262, - "grad_norm": 16.15435028076172, - "learning_rate": 1.9749315068493153e-05, - "loss": 0.8409, + "epoch": 6.161971830985916, + "grad_norm": 14.457427978515625, + "learning_rate": 1.9768005637773083e-05, + "loss": 0.7991, "step": 1750 }, { - "epoch": 6.653992395437262, + "epoch": 6.161971830985916, "step": 1750, - "train/classification_loss": 0.16006724536418915, - "train/contrastive_loss": 1.215085744857788, - "train/negative_loss": 0.6944472789764404, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.5206384658813477, - "train/total_loss": 0.403084397315979 + "train/classification_loss": 0.20019212365150452, + "train/contrastive_loss": 0.8180999159812927, + "train/negative_loss": 0.8180310130119324, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 6.890534132253379e-05, + "train/total_loss": 0.36381208896636963 }, { - "epoch": 6.653992395437262, + "epoch": 6.161971830985916, "step": 1750, - "train/classification_loss": 0.16344404220581055, - "train/contrastive_loss": 0.4790329337120056, - "train/negative_loss": 0.47518783807754517, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.0038451040163636208, - "train/total_loss": 0.2592506408691406 + "train/classification_loss": 0.17518675327301025, + "train/contrastive_loss": 0.8647081851959229, + "train/negative_loss": 0.5790228843688965, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.28568530082702637, + "train/total_loss": 0.34812837839126587 }, { - "epoch": 6.844106463878327, - "grad_norm": 10.93616008758545, - "learning_rate": 1.974170471841705e-05, - "loss": 0.8203, + "epoch": 6.338028169014084, + "grad_norm": 8.555068016052246, + "learning_rate": 1.976095842142354e-05, + "loss": 0.8147, "step": 1800 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.24718542397022247, - "train/contrastive_loss": 1.3273639678955078, - "train/negative_loss": 0.4558310806751251, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.8715329170227051, - "train/total_loss": 0.5126582384109497 + "train/classification_loss": 0.23618440330028534, + "train/contrastive_loss": 2.4996490478515625, + "train/negative_loss": 0.9613112211227417, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.5383377075195312, + "train/total_loss": 0.7361142039299011 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.22704379260540009, - "train/contrastive_loss": 2.034367799758911, - "train/negative_loss": 1.2144545316696167, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.8199133276939392, - "train/total_loss": 0.6339173316955566 + "train/classification_loss": 0.2643356919288635, + "train/contrastive_loss": 1.064527988433838, + "train/negative_loss": 0.4917549788951874, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.5727729797363281, + "train/total_loss": 0.47724127769470215 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.1658373326063156, - "train/contrastive_loss": 2.045210838317871, - "train/negative_loss": 0.9495800733566284, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.0956306457519531, - "train/total_loss": 0.57487952709198 + "train/classification_loss": 0.2525252103805542, + "train/contrastive_loss": 2.6638693809509277, + "train/negative_loss": 1.0702341794967651, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.593635082244873, + "train/total_loss": 0.7852991223335266 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.18691794574260712, - "train/contrastive_loss": 2.8457865715026855, - "train/negative_loss": 1.8239173889160156, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.0218690633773804, - "train/total_loss": 0.7560752630233765 + "train/classification_loss": 0.13786518573760986, + "train/contrastive_loss": 0.6768171787261963, + "train/negative_loss": 0.5316019654273987, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.14521524310112, + "train/total_loss": 0.27322864532470703 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.14641442894935608, - "train/contrastive_loss": 1.2959307432174683, - "train/negative_loss": 1.0943429470062256, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.2015877515077591, - "train/total_loss": 0.40560057759284973 + "train/classification_loss": 0.20317767560482025, + "train/contrastive_loss": 2.362442970275879, + "train/negative_loss": 2.241147518157959, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.1212954893708229, + "train/total_loss": 0.6756662726402283 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.18013876676559448, - "train/contrastive_loss": 2.1482126712799072, - "train/negative_loss": 1.623271107673645, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.5249415040016174, - "train/total_loss": 0.6097812652587891 + "train/classification_loss": 0.20733687281608582, + "train/contrastive_loss": 2.196223020553589, + "train/negative_loss": 1.3789563179016113, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.8172667026519775, + "train/total_loss": 0.6465814709663391 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.23120087385177612, - "train/contrastive_loss": 1.141149878501892, - "train/negative_loss": 1.0805281400680542, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.060621701180934906, - "train/total_loss": 0.45943087339401245 + "train/classification_loss": 0.1985493302345276, + "train/contrastive_loss": 1.9548351764678955, + "train/negative_loss": 0.8695181012153625, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.0853171348571777, + "train/total_loss": 0.5895164012908936 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.16650141775608063, - "train/contrastive_loss": 1.0847113132476807, - "train/negative_loss": 0.9511285424232483, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.13358280062675476, - "train/total_loss": 0.383443683385849 + "train/classification_loss": 0.20806984603405, + "train/contrastive_loss": 1.0504621267318726, + "train/negative_loss": 1.049856424331665, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 0.0006056473357602954, + "train/total_loss": 0.4181622862815857 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.15409955382347107, - "train/contrastive_loss": 1.262139916419983, - "train/negative_loss": 1.253958821296692, + "train/classification_loss": 0.13133777678012848, + "train/contrastive_loss": 0.6291182637214661, + "train/negative_loss": 0.45217472314834595, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.008181067183613777, - "train/total_loss": 0.4065275490283966 + "train/positive_loss": 0.17694354057312012, + "train/total_loss": 0.2571614384651184 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.30725425481796265, - "train/contrastive_loss": 3.194790840148926, - "train/negative_loss": 1.243918538093567, + "train/classification_loss": 0.20885518193244934, + "train/contrastive_loss": 1.6074930429458618, + "train/negative_loss": 1.3285659551620483, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.9508721828460693, - "train/total_loss": 0.9462124109268188 + "train/num_positives": 14, + "train/positive_loss": 0.27892711758613586, + "train/total_loss": 0.5303537845611572 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.19303932785987854, - "train/contrastive_loss": 1.842782974243164, - "train/negative_loss": 1.4596999883651733, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.38308292627334595, - "train/total_loss": 0.5615959167480469 + "train/classification_loss": 0.16874989867210388, + "train/contrastive_loss": 1.2389817237854004, + "train/negative_loss": 0.8842199444770813, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.3547617197036743, + "train/total_loss": 0.4165462255477905 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.12159647792577744, - "train/contrastive_loss": 0.560375988483429, - "train/negative_loss": 0.41072529554367065, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.1496506780385971, - "train/total_loss": 0.23367168009281158 + "train/classification_loss": 0.18696634471416473, + "train/contrastive_loss": 1.7192937135696411, + "train/negative_loss": 1.7190954685211182, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.0001982092799153179, + "train/total_loss": 0.5308250784873962 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.2652417719364166, - "train/contrastive_loss": 4.690550804138184, - "train/negative_loss": 2.5094735622406006, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 2.181077003479004, - "train/total_loss": 1.2033519744873047 + "train/classification_loss": 0.2098003774881363, + "train/contrastive_loss": 3.7497010231018066, + "train/negative_loss": 2.165863037109375, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.5838379859924316, + "train/total_loss": 0.9597405791282654 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.14213475584983826, - "train/contrastive_loss": 2.65765643119812, - "train/negative_loss": 2.651808500289917, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.005847997032105923, - "train/total_loss": 0.6736660003662109 + "train/classification_loss": 0.1998313069343567, + "train/contrastive_loss": 1.3455989360809326, + "train/negative_loss": 0.9798943996429443, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.3657044768333435, + "train/total_loss": 0.46895110607147217 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.13620984554290771, - "train/contrastive_loss": 1.7645483016967773, - "train/negative_loss": 1.53364098072052, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.23090730607509613, - "train/total_loss": 0.4891194999217987 + "train/classification_loss": 0.14849337935447693, + "train/contrastive_loss": 2.0187861919403076, + "train/negative_loss": 0.6614004969596863, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.3573856353759766, + "train/total_loss": 0.5522506237030029 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.15064281225204468, - "train/contrastive_loss": 0.8089166283607483, - "train/negative_loss": 0.8037953972816467, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.005121228285133839, - "train/total_loss": 0.3124261498451233 + "train/classification_loss": 0.18422512710094452, + "train/contrastive_loss": 1.5316643714904785, + "train/negative_loss": 0.697216808795929, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.8344475626945496, + "train/total_loss": 0.49055802822113037 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.24252475798130035, - "train/contrastive_loss": 2.834036350250244, - "train/negative_loss": 1.597424864768982, - "train/num_negatives": 40, + "train/classification_loss": 0.14369253814220428, + "train/contrastive_loss": 1.3306763172149658, + "train/negative_loss": 0.7949985265731812, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 1.2366116046905518, - "train/total_loss": 0.809332013130188 + "train/positive_loss": 0.5356777310371399, + "train/total_loss": 0.4098278284072876 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.1735846847295761, - "train/contrastive_loss": 0.8815721273422241, - "train/negative_loss": 0.37989696860313416, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.5016751885414124, - "train/total_loss": 0.3498991131782532 + "train/classification_loss": 0.20878709852695465, + "train/contrastive_loss": 1.59965980052948, + "train/negative_loss": 1.4177470207214355, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.18191276490688324, + "train/total_loss": 0.5287190675735474 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.21319997310638428, - "train/contrastive_loss": 1.9631239175796509, - "train/negative_loss": 1.8245694637298584, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.13855448365211487, - "train/total_loss": 0.6058247685432434 + "train/classification_loss": 0.1755540668964386, + "train/contrastive_loss": 0.5103244781494141, + "train/negative_loss": 0.47977203130722046, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.030552471056580544, + "train/total_loss": 0.27761897444725037 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.16779378056526184, - "train/contrastive_loss": 2.264986276626587, - "train/negative_loss": 1.9267170429229736, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.3382691442966461, - "train/total_loss": 0.6207910776138306 + "train/classification_loss": 0.19091834127902985, + "train/contrastive_loss": 3.2964799404144287, + "train/negative_loss": 1.5835227966308594, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.7129571437835693, + "train/total_loss": 0.8502143025398254 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.26110127568244934, - "train/contrastive_loss": 1.814990520477295, - "train/negative_loss": 0.7181379199028015, - "train/num_negatives": 44, + "train/classification_loss": 0.15718308091163635, + "train/contrastive_loss": 1.6903914213180542, + "train/negative_loss": 1.6703453063964844, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.0968526601791382, - "train/total_loss": 0.6240993738174438 + "train/positive_loss": 0.020046083256602287, + "train/total_loss": 0.49526137113571167 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.24143920838832855, - "train/contrastive_loss": 1.5418623685836792, - "train/negative_loss": 1.4387538433074951, - "train/num_negatives": 44, + "train/classification_loss": 0.13766010105609894, + "train/contrastive_loss": 2.6639468669891357, + "train/negative_loss": 1.8816156387329102, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.1031084731221199, - "train/total_loss": 0.5498116612434387 + "train/positive_loss": 0.7823312282562256, + "train/total_loss": 0.6704494953155518 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.13931678235530853, - "train/contrastive_loss": 0.852718710899353, - "train/negative_loss": 0.3396717607975006, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.5130469799041748, - "train/total_loss": 0.3098605275154114 + "train/classification_loss": 0.1847010850906372, + "train/contrastive_loss": 2.585862636566162, + "train/negative_loss": 1.293681263923645, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 1.2921814918518066, + "train/total_loss": 0.7018736004829407 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.14122585952281952, - "train/contrastive_loss": 0.35162150859832764, - "train/negative_loss": 0.3497757613658905, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.001845743739977479, - "train/total_loss": 0.21155016124248505 + "train/classification_loss": 0.24528996646404266, + "train/contrastive_loss": 3.4418249130249023, + "train/negative_loss": 1.574407696723938, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.8674172163009644, + "train/total_loss": 0.9336549639701843 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.12434650957584381, - "train/contrastive_loss": 1.636486530303955, - "train/negative_loss": 1.5663236379623413, + "train/classification_loss": 0.18155448138713837, + "train/contrastive_loss": 2.0227980613708496, + "train/negative_loss": 0.8087050914764404, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.07016285508871078, - "train/total_loss": 0.45164382457733154 + "train/num_positives": 10, + "train/positive_loss": 1.2140930891036987, + "train/total_loss": 0.5861141085624695 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.25728076696395874, - "train/contrastive_loss": 1.1682240962982178, - "train/negative_loss": 0.4004468023777008, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 0.7677773237228394, - "train/total_loss": 0.4909256100654602 + "train/classification_loss": 0.2012697458267212, + "train/contrastive_loss": 2.402578592300415, + "train/negative_loss": 1.9920814037322998, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.41049715876579285, + "train/total_loss": 0.6817854642868042 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.2691647708415985, - "train/contrastive_loss": 2.9926323890686035, - "train/negative_loss": 1.5942788124084473, + "train/classification_loss": 0.20460467040538788, + "train/contrastive_loss": 1.5915348529815674, + "train/negative_loss": 1.58004891872406, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.3983535766601562, - "train/total_loss": 0.8676912784576416 + "train/num_positives": 4, + "train/positive_loss": 0.011485951952636242, + "train/total_loss": 0.5229116678237915 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.18355832993984222, - "train/contrastive_loss": 2.1194846630096436, - "train/negative_loss": 1.9304311275482178, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.18905344605445862, - "train/total_loss": 0.6074552536010742 + "train/classification_loss": 0.1931326985359192, + "train/contrastive_loss": 0.20014992356300354, + "train/negative_loss": 0.18774820864200592, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.012401716783642769, + "train/total_loss": 0.23316268622875214 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.20397204160690308, - "train/contrastive_loss": 1.233396291732788, - "train/negative_loss": 0.551781952381134, - "train/num_negatives": 40, + "train/classification_loss": 0.2523374557495117, + "train/contrastive_loss": 3.8048558235168457, + "train/negative_loss": 1.7720197439193726, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.6816143989562988, - "train/total_loss": 0.45065128803253174 - }, - { - "epoch": 6.844106463878327, - "step": 1800, - "train/classification_loss": 0.21549808979034424, - "train/contrastive_loss": 1.294891357421875, - "train/negative_loss": 0.940403163433075, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.3544882535934448, - "train/total_loss": 0.4744763672351837 - }, - { - "epoch": 6.844106463878327, - "step": 1800, - "train/classification_loss": 0.15361271798610687, - "train/contrastive_loss": 1.5948383808135986, - "train/negative_loss": 1.1710091829299927, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.42382919788360596, - "train/total_loss": 0.4725803732872009 + "train/positive_loss": 2.0328359603881836, + "train/total_loss": 1.0133086442947388 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.24327901005744934, - "train/contrastive_loss": 3.2757797241210938, - "train/negative_loss": 2.221092700958252, + "train/classification_loss": 0.2193804532289505, + "train/contrastive_loss": 0.9227731823921204, + "train/negative_loss": 0.9027462005615234, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.0546870231628418, - "train/total_loss": 0.8984349966049194 + "train/num_positives": 10, + "train/positive_loss": 0.020026957616209984, + "train/total_loss": 0.4039350748062134 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.22694382071495056, - "train/contrastive_loss": 0.5336241722106934, - "train/negative_loss": 0.5318108201026917, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0018133262638002634, - "train/total_loss": 0.33366864919662476 + "train/classification_loss": 0.16964419186115265, + "train/contrastive_loss": 1.3177131414413452, + "train/negative_loss": 1.3112902641296387, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.006422827020287514, + "train/total_loss": 0.4331868290901184 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.21941176056861877, - "train/contrastive_loss": 2.449995994567871, - "train/negative_loss": 1.4631177186965942, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.9868783354759216, - "train/total_loss": 0.7094109654426575 + "train/classification_loss": 0.1795284003019333, + "train/contrastive_loss": 1.8620396852493286, + "train/negative_loss": 1.4069775342941284, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.4550621509552002, + "train/total_loss": 0.5519363284111023 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.21619711816310883, - "train/contrastive_loss": 4.843829154968262, - "train/negative_loss": 2.602778673171997, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 2.2410502433776855, - "train/total_loss": 1.1849629878997803 + "train/classification_loss": 0.19057753682136536, + "train/contrastive_loss": 1.9349257946014404, + "train/negative_loss": 1.1791791915893555, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.7557465434074402, + "train/total_loss": 0.577562689781189 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.18410266935825348, - "train/contrastive_loss": 3.7518677711486816, - "train/negative_loss": 2.003365993499756, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.7485018968582153, - "train/total_loss": 0.9344761967658997 + "train/classification_loss": 0.21294724941253662, + "train/contrastive_loss": 2.0243303775787354, + "train/negative_loss": 1.519113302230835, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.5052170157432556, + "train/total_loss": 0.6178133487701416 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.16783694922924042, - "train/contrastive_loss": 1.2611719369888306, - "train/negative_loss": 1.0960545539855957, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.16511736810207367, - "train/total_loss": 0.4200713634490967 + "train/classification_loss": 0.24014151096343994, + "train/contrastive_loss": 2.0354576110839844, + "train/negative_loss": 0.8759483098983765, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 1.1595091819763184, + "train/total_loss": 0.6472330093383789 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.19486811757087708, - "train/contrastive_loss": 1.5325144529342651, - "train/negative_loss": 1.0833574533462524, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.4491569995880127, - "train/total_loss": 0.5013710260391235 + "train/classification_loss": 0.15081846714019775, + "train/contrastive_loss": 1.7187182903289795, + "train/negative_loss": 1.7186675071716309, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 5.083685027784668e-05, + "train/total_loss": 0.4945621192455292 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.21038618683815002, - "train/contrastive_loss": 2.2118375301361084, - "train/negative_loss": 2.1096384525299072, + "train/classification_loss": 0.21892698109149933, + "train/contrastive_loss": 0.8051426410675049, + "train/negative_loss": 0.39136651158332825, "train/num_negatives": 46, "train/num_positives": 8, - "train/positive_loss": 0.10219912976026535, - "train/total_loss": 0.6527537107467651 + "train/positive_loss": 0.413776159286499, + "train/total_loss": 0.379955530166626 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.19027374684810638, - "train/contrastive_loss": 2.3098785877227783, - "train/negative_loss": 2.3023293018341064, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.007549218833446503, - "train/total_loss": 0.6522494554519653 + "train/classification_loss": 0.2578733563423157, + "train/contrastive_loss": 2.6372523307800293, + "train/negative_loss": 2.32843017578125, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.30882227420806885, + "train/total_loss": 0.7853238582611084 + }, + { + "epoch": 6.338028169014084, + "step": 1800, + "train/classification_loss": 0.21549485623836517, + "train/contrastive_loss": 0.7917541265487671, + "train/negative_loss": 0.43763402104377747, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.35412007570266724, + "train/total_loss": 0.3738456964492798 + }, + { + "epoch": 6.338028169014084, + "step": 1800, + "train/classification_loss": 0.282681405544281, + "train/contrastive_loss": 3.414781093597412, + "train/negative_loss": 2.166337251663208, + "train/num_negatives": 42, + "train/num_positives": 8, + "train/positive_loss": 1.2484439611434937, + "train/total_loss": 0.9656376242637634 + }, + { + "epoch": 6.338028169014084, + "step": 1800, + "train/classification_loss": 0.14941991865634918, + "train/contrastive_loss": 0.9621403217315674, + "train/negative_loss": 0.629996657371521, + "train/num_negatives": 46, + "train/num_positives": 10, + "train/positive_loss": 0.332143634557724, + "train/total_loss": 0.3418479859828949 + }, + { + "epoch": 6.338028169014084, + "step": 1800, + "train/classification_loss": 0.17254632711410522, + "train/contrastive_loss": 2.058793544769287, + "train/negative_loss": 1.2110460996627808, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.8477475643157959, + "train/total_loss": 0.5843050479888916 + }, + { + "epoch": 6.338028169014084, + "step": 1800, + "train/classification_loss": 0.1880212128162384, + "train/contrastive_loss": 0.8820734024047852, + "train/negative_loss": 0.8819945454597473, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 7.886016828706488e-05, + "train/total_loss": 0.36443591117858887 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.18013280630111694, - "train/contrastive_loss": 1.1409265995025635, - "train/negative_loss": 1.0742335319519043, + "train/classification_loss": 0.2603602111339569, + "train/contrastive_loss": 1.15123450756073, + "train/negative_loss": 1.1470509767532349, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.066693015396595, - "train/total_loss": 0.4083181321620941 + "train/positive_loss": 0.004183569457381964, + "train/total_loss": 0.4906071126461029 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.19509540498256683, - "train/contrastive_loss": 2.1398746967315674, - "train/negative_loss": 1.7655938863754272, - "train/num_negatives": 36, + "train/classification_loss": 0.1882232129573822, + "train/contrastive_loss": 0.6139564514160156, + "train/negative_loss": 0.6025113463401794, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.011445131152868271, + "train/total_loss": 0.3110145032405853 + }, + { + "epoch": 6.338028169014084, + "step": 1800, + "train/classification_loss": 0.3184067904949188, + "train/contrastive_loss": 3.5926332473754883, + "train/negative_loss": 2.827404022216797, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.37428078055381775, - "train/total_loss": 0.6230703592300415 + "train/positive_loss": 0.7652291059494019, + "train/total_loss": 1.036933422088623 + }, + { + "epoch": 6.338028169014084, + "step": 1800, + "train/classification_loss": 0.17019306123256683, + "train/contrastive_loss": 1.4210273027420044, + "train/negative_loss": 1.062803864479065, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.35822346806526184, + "train/total_loss": 0.454398512840271 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.22948279976844788, - "train/contrastive_loss": 1.271140456199646, - "train/negative_loss": 0.5134792327880859, + "train/classification_loss": 0.21009114384651184, + "train/contrastive_loss": 2.857487916946411, + "train/negative_loss": 2.3472461700439453, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.7576612234115601, - "train/total_loss": 0.4837108850479126 + "train/num_positives": 14, + "train/positive_loss": 0.5102417469024658, + "train/total_loss": 0.7815887928009033 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.16807900369167328, - "train/contrastive_loss": 2.7441728115081787, - "train/negative_loss": 1.3006181716918945, + "train/classification_loss": 0.25049540400505066, + "train/contrastive_loss": 2.4972052574157715, + "train/negative_loss": 2.497196912765503, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.4435546398162842, - "train/total_loss": 0.7169135808944702 + "train/num_positives": 2, + "train/positive_loss": 8.225474630307872e-06, + "train/total_loss": 0.7499364614486694 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.14641965925693512, - "train/contrastive_loss": 1.0180872678756714, - "train/negative_loss": 0.550064742565155, + "train/classification_loss": 0.20436859130859375, + "train/contrastive_loss": 1.9877409934997559, + "train/negative_loss": 0.980452835559845, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.46802249550819397, - "train/total_loss": 0.3500370979309082 + "train/num_positives": 16, + "train/positive_loss": 1.0072880983352661, + "train/total_loss": 0.6019167900085449 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.29122111201286316, - "train/contrastive_loss": 2.198141098022461, - "train/negative_loss": 0.9598488211631775, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 1.2382923364639282, - "train/total_loss": 0.7308493256568909 + "train/classification_loss": 0.15812022984027863, + "train/contrastive_loss": 0.2669823169708252, + "train/negative_loss": 0.19041016697883606, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.07657214254140854, + "train/total_loss": 0.21151669323444366 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.12605565786361694, - "train/contrastive_loss": 0.9111488461494446, - "train/negative_loss": 0.9111378192901611, - "train/num_negatives": 48, + "train/classification_loss": 0.21329163014888763, + "train/contrastive_loss": 0.8076227307319641, + "train/negative_loss": 0.6478399634361267, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 1.1026937499991618e-05, - "train/total_loss": 0.3082854151725769 + "train/positive_loss": 0.1597827672958374, + "train/total_loss": 0.3748161792755127 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.1596829742193222, - "train/contrastive_loss": 0.20777921378612518, - "train/negative_loss": 0.1834155023097992, + "train/classification_loss": 0.21620073914527893, + "train/contrastive_loss": 0.8952352404594421, + "train/negative_loss": 0.8577362895011902, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.02436370961368084, - "train/total_loss": 0.20123881101608276 + "train/num_positives": 14, + "train/positive_loss": 0.03749896213412285, + "train/total_loss": 0.39524778723716736 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.11509941518306732, - "train/contrastive_loss": 1.0395621061325073, - "train/negative_loss": 1.030341386795044, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.009220683015882969, - "train/total_loss": 0.3230118453502655 + "train/classification_loss": 0.30255407094955444, + "train/contrastive_loss": 2.703613758087158, + "train/negative_loss": 1.199798822402954, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 1.5038150548934937, + "train/total_loss": 0.843276858329773 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.20567600429058075, - "train/contrastive_loss": 1.1388304233551025, - "train/negative_loss": 1.1341861486434937, - "train/num_negatives": 28, + "train/classification_loss": 0.14780624210834503, + "train/contrastive_loss": 1.1930758953094482, + "train/negative_loss": 0.36876219511032104, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.0046442365273833275, - "train/total_loss": 0.433442085981369 + "train/positive_loss": 0.824313759803772, + "train/total_loss": 0.38642144203186035 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.17609809339046478, - "train/contrastive_loss": 1.8256901502609253, - "train/negative_loss": 1.387337327003479, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.4383528530597687, - "train/total_loss": 0.5412361025810242 + "train/classification_loss": 0.14649800956249237, + "train/contrastive_loss": 1.084219217300415, + "train/negative_loss": 0.3242172300815582, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.7600019574165344, + "train/total_loss": 0.3633418679237366 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.1731565296649933, - "train/contrastive_loss": 0.6739047169685364, - "train/negative_loss": 0.6736093759536743, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.00029536051442846656, - "train/total_loss": 0.30793747305870056 + "train/classification_loss": 0.1859196573495865, + "train/contrastive_loss": 2.993258237838745, + "train/negative_loss": 0.9514286518096924, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 2.0418295860290527, + "train/total_loss": 0.7845712900161743 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.1878020465373993, - "train/contrastive_loss": 1.817173719406128, - "train/negative_loss": 0.8008537292480469, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.016319990158081, - "train/total_loss": 0.5512368083000183 + "train/classification_loss": 0.20863163471221924, + "train/contrastive_loss": 2.637061834335327, + "train/negative_loss": 1.389975666999817, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.2470861673355103, + "train/total_loss": 0.7360439896583557 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.22236162424087524, - "train/contrastive_loss": 1.8347773551940918, - "train/negative_loss": 1.4520273208618164, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.382750004529953, - "train/total_loss": 0.5893170833587646 + "train/classification_loss": 0.21374037861824036, + "train/contrastive_loss": 1.1649141311645508, + "train/negative_loss": 0.9411524534225464, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.22376161813735962, + "train/total_loss": 0.44672322273254395 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.15086911618709564, - "train/contrastive_loss": 0.48911604285240173, - "train/negative_loss": 0.400454044342041, + "train/classification_loss": 0.13585400581359863, + "train/contrastive_loss": 0.2632651627063751, + "train/negative_loss": 0.24225668609142303, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.08866199105978012, - "train/total_loss": 0.2486923336982727 + "train/num_positives": 16, + "train/positive_loss": 0.021008474752306938, + "train/total_loss": 0.18850703537464142 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.17545746266841888, - "train/contrastive_loss": 2.8347887992858887, - "train/negative_loss": 2.2172977924346924, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.6174910068511963, - "train/total_loss": 0.7424152493476868 + "train/classification_loss": 0.19233687222003937, + "train/contrastive_loss": 2.8636417388916016, + "train/negative_loss": 1.3234347105026245, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 1.5402069091796875, + "train/total_loss": 0.7650651931762695 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.23916059732437134, - "train/contrastive_loss": 2.4696121215820312, - "train/negative_loss": 1.4405335187911987, + "train/classification_loss": 0.26650911569595337, + "train/contrastive_loss": 1.9120588302612305, + "train/negative_loss": 1.7381545305252075, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.029078722000122, - "train/total_loss": 0.7330830097198486 + "train/num_positives": 2, + "train/positive_loss": 0.17390435934066772, + "train/total_loss": 0.6489208936691284 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.21360935270786285, - "train/contrastive_loss": 2.329637050628662, - "train/negative_loss": 1.6897577047348022, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.6398792862892151, - "train/total_loss": 0.679536759853363 + "train/classification_loss": 0.1460341066122055, + "train/contrastive_loss": 1.1903585195541382, + "train/negative_loss": 0.9340766668319702, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.2562818229198456, + "train/total_loss": 0.3841058015823364 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.1832314133644104, - "train/contrastive_loss": 2.906201124191284, - "train/negative_loss": 2.4322071075439453, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.4739939272403717, - "train/total_loss": 0.7644716501235962 + "train/classification_loss": 0.19368679821491241, + "train/contrastive_loss": 0.8795298337936401, + "train/negative_loss": 0.7353776693344116, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.14415216445922852, + "train/total_loss": 0.3695927858352661 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.22464171051979065, - "train/contrastive_loss": 3.2753419876098633, - "train/negative_loss": 2.215752601623535, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.0595893859863281, - "train/total_loss": 0.8797100782394409 + "train/classification_loss": 0.19111137092113495, + "train/contrastive_loss": 1.9831018447875977, + "train/negative_loss": 0.8209530711174011, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 1.1621488332748413, + "train/total_loss": 0.5877317190170288 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.2104712426662445, - "train/contrastive_loss": 4.315834999084473, - "train/negative_loss": 3.713897466659546, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.6019375920295715, - "train/total_loss": 1.0736382007598877 + "train/classification_loss": 0.20079556107521057, + "train/contrastive_loss": 5.566178321838379, + "train/negative_loss": 5.566175937652588, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 2.3841892016207566e-06, + "train/total_loss": 1.3140312433242798 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.24290253221988678, - "train/contrastive_loss": 2.635499954223633, - "train/negative_loss": 1.7884712219238281, + "train/classification_loss": 0.190120667219162, + "train/contrastive_loss": 0.8163983821868896, + "train/negative_loss": 0.39662086963653564, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.8470288515090942, - "train/total_loss": 0.770002543926239 + "train/positive_loss": 0.4197775423526764, + "train/total_loss": 0.3534003496170044 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.18409913778305054, - "train/contrastive_loss": 0.5596603155136108, - "train/negative_loss": 0.5562171936035156, + "train/classification_loss": 0.21868683397769928, + "train/contrastive_loss": 2.932465076446533, + "train/negative_loss": 1.7568747997283936, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.0034431132953613997, - "train/total_loss": 0.2960312068462372 + "train/num_positives": 8, + "train/positive_loss": 1.1755903959274292, + "train/total_loss": 0.8051798343658447 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.17445294559001923, - "train/contrastive_loss": 1.3158659934997559, - "train/negative_loss": 0.7218444347381592, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.5940216183662415, - "train/total_loss": 0.4376261234283447 + "train/classification_loss": 0.1656399667263031, + "train/contrastive_loss": 1.8630726337432861, + "train/negative_loss": 0.8169066905975342, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.046165943145752, + "train/total_loss": 0.5382544994354248 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.1795436590909958, - "train/contrastive_loss": 1.818366527557373, - "train/negative_loss": 0.7833738923072815, - "train/num_negatives": 46, + "train/classification_loss": 0.25913915038108826, + "train/contrastive_loss": 1.9436025619506836, + "train/negative_loss": 1.7970094680786133, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 1.0349926948547363, - "train/total_loss": 0.5432169437408447 + "train/positive_loss": 0.14659306406974792, + "train/total_loss": 0.6478596925735474 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.24529393017292023, - "train/contrastive_loss": 1.4335335493087769, - "train/negative_loss": 1.4335335493087769, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5320006608963013 - }, - { - "epoch": 6.844106463878327, - "eval_exact_match_accuracy": 0.26476190476190475, - "eval_hamming_loss": 0.06980392156862746, - "eval_loss": 0.5701467394828796, - "eval_macro_f1": 0.22440961510593738, - "eval_macro_precision": 0.5265725916973413, - "eval_macro_recall": 0.17414232009191752, - "eval_micro_f1": 0.5113725490196078, - "eval_micro_precision": 0.8232323232323232, - "eval_micro_recall": 0.3708759954493743, - "eval_runtime": 2.6208, - "eval_samples_per_second": 200.321, - "eval_steps_per_second": 25.183, + "train/classification_loss": 0.19009657204151154, + "train/contrastive_loss": 1.6608723402023315, + "train/negative_loss": 1.394348382949829, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.26652395725250244, + "train/total_loss": 0.5222710371017456 + }, + { + "epoch": 6.338028169014084, + "eval_exact_match_accuracy": 0.24691358024691357, + "eval_hamming_loss": 0.0718954248366013, + "eval_loss": 0.5680800080299377, + "eval_macro_f1": 0.2427411732331366, + "eval_macro_precision": 0.47275031413037283, + "eval_macro_recall": 0.19414416262327208, + "eval_micro_f1": 0.4746019711902957, + "eval_micro_precision": 0.821522309711286, + "eval_micro_recall": 0.3336886993603412, + "eval_runtime": 2.8484, + "eval_samples_per_second": 199.062, + "eval_steps_per_second": 24.927, "step": 1800 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.1748284250497818, - "train/contrastive_loss": 0.8777519464492798, - "train/negative_loss": 0.8727569580078125, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.004994993098080158, - "train/total_loss": 0.3503788113594055 + "train/classification_loss": 0.1515735685825348, + "train/contrastive_loss": 0.8138993382453918, + "train/negative_loss": 0.6973198056221008, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.11657953262329102, + "train/total_loss": 0.31435343623161316 }, { - "epoch": 6.844106463878327, + "epoch": 6.338028169014084, "step": 1800, - "train/classification_loss": 0.16796070337295532, - "train/contrastive_loss": 0.7820920348167419, - "train/negative_loss": 0.756605863571167, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.025486182421445847, - "train/total_loss": 0.3243791162967682 + "train/classification_loss": 0.18316659331321716, + "train/contrastive_loss": 1.312180757522583, + "train/negative_loss": 0.9477595686912537, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.3644212484359741, + "train/total_loss": 0.44560274481773376 }, { - "epoch": 7.034220532319392, - "grad_norm": 9.459121704101562, - "learning_rate": 1.9734094368340946e-05, - "loss": 0.8097, + "epoch": 6.514084507042254, + "grad_norm": 30.647846221923828, + "learning_rate": 1.9753911205073996e-05, + "loss": 0.7836, "step": 1850 }, { - "epoch": 7.034220532319392, + "epoch": 6.514084507042254, "step": 1850, - "train/classification_loss": 0.14938408136367798, - "train/contrastive_loss": 0.6288790702819824, - "train/negative_loss": 0.6266802549362183, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.0021988386288285255, - "train/total_loss": 0.27515989542007446 + "train/classification_loss": 0.13582298159599304, + "train/contrastive_loss": 0.8106577396392822, + "train/negative_loss": 0.49388763308525085, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.31677013635635376, + "train/total_loss": 0.2979545295238495 }, { - "epoch": 7.034220532319392, + "epoch": 6.514084507042254, "step": 1850, - "train/classification_loss": 0.14405231177806854, - "train/contrastive_loss": 0.25956884026527405, - "train/negative_loss": 0.24571874737739563, - "train/num_negatives": 36, - "train/num_positives": 20, - "train/positive_loss": 0.013850104995071888, - "train/total_loss": 0.19596607983112335 + "train/classification_loss": 0.21405598521232605, + "train/contrastive_loss": 1.100415587425232, + "train/negative_loss": 0.6814552545547485, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 0.4189603328704834, + "train/total_loss": 0.43413910269737244 }, { - "epoch": 7.224334600760456, - "grad_norm": 8.780190467834473, - "learning_rate": 1.9726484018264844e-05, - "loss": 0.727, + "epoch": 6.690140845070422, + "grad_norm": 12.289376258850098, + "learning_rate": 1.9746863988724457e-05, + "loss": 0.8155, "step": 1900 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.26934614777565, - "train/contrastive_loss": 1.655250906944275, - "train/negative_loss": 0.9808627963066101, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.6743881106376648, - "train/total_loss": 0.6003963351249695 + "train/classification_loss": 0.23372109234333038, + "train/contrastive_loss": 3.2158899307250977, + "train/negative_loss": 1.3862863779067993, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.829603672027588, + "train/total_loss": 0.8768990635871887 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.22692139446735382, - "train/contrastive_loss": 2.6190361976623535, - "train/negative_loss": 1.417634129524231, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 1.201401948928833, - "train/total_loss": 0.7507286071777344 + "train/classification_loss": 0.27038395404815674, + "train/contrastive_loss": 0.7699598073959351, + "train/negative_loss": 0.599881649017334, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.17007815837860107, + "train/total_loss": 0.4243759214878082 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.17449703812599182, - "train/contrastive_loss": 1.8056697845458984, - "train/negative_loss": 0.41948631405830383, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.386183500289917, - "train/total_loss": 0.535631000995636 + "train/classification_loss": 0.23821960389614105, + "train/contrastive_loss": 2.791719913482666, + "train/negative_loss": 1.4407185316085815, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.351001262664795, + "train/total_loss": 0.7965636253356934 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.2034793496131897, - "train/contrastive_loss": 2.0835914611816406, - "train/negative_loss": 1.3412920236587524, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.7422994375228882, - "train/total_loss": 0.6201976537704468 + "train/classification_loss": 0.14065875113010406, + "train/contrastive_loss": 1.65958571434021, + "train/negative_loss": 0.9428386092185974, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.7167471051216125, + "train/total_loss": 0.4725759029388428 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.1510898619890213, - "train/contrastive_loss": 1.381009817123413, - "train/negative_loss": 0.5867534279823303, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.7942564487457275, - "train/total_loss": 0.4272918105125427 + "train/classification_loss": 0.22161826491355896, + "train/contrastive_loss": 3.0368266105651855, + "train/negative_loss": 2.989464521408081, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.04736214876174927, + "train/total_loss": 0.8289835453033447 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.18075862526893616, - "train/contrastive_loss": 2.1407604217529297, - "train/negative_loss": 1.2356919050216675, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.905068576335907, - "train/total_loss": 0.6089106798171997 + "train/classification_loss": 0.2155858427286148, + "train/contrastive_loss": 2.4562065601348877, + "train/negative_loss": 2.086688756942749, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.3695177435874939, + "train/total_loss": 0.7068271636962891 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.23400011658668518, - "train/contrastive_loss": 1.3978873491287231, - "train/negative_loss": 1.3202074766159058, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.0776798203587532, - "train/total_loss": 0.5135775804519653 + "train/classification_loss": 0.19224867224693298, + "train/contrastive_loss": 1.82871675491333, + "train/negative_loss": 1.0345207452774048, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.7941960096359253, + "train/total_loss": 0.5579920411109924 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.1615360826253891, - "train/contrastive_loss": 1.0852676630020142, - "train/negative_loss": 1.0290656089782715, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.056202035397291183, - "train/total_loss": 0.3785896301269531 + "train/classification_loss": 0.20780417323112488, + "train/contrastive_loss": 1.473059058189392, + "train/negative_loss": 1.4729293584823608, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 0.000129708118038252, + "train/total_loss": 0.5024160146713257 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.14986009895801544, - "train/contrastive_loss": 1.2430669069290161, - "train/negative_loss": 1.1650848388671875, + "train/classification_loss": 0.11690351366996765, + "train/contrastive_loss": 0.24079112708568573, + "train/negative_loss": 0.1931220442056656, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.07798203825950623, - "train/total_loss": 0.39847350120544434 + "train/positive_loss": 0.04766908288002014, + "train/total_loss": 0.16506174206733704 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.29052045941352844, - "train/contrastive_loss": 2.6619420051574707, - "train/negative_loss": 1.7947604656219482, + "train/classification_loss": 0.23107852041721344, + "train/contrastive_loss": 2.6729283332824707, + "train/negative_loss": 1.9350939989089966, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.867181658744812, - "train/total_loss": 0.822908878326416 + "train/num_positives": 14, + "train/positive_loss": 0.7378343939781189, + "train/total_loss": 0.7656641602516174 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.19971878826618195, - "train/contrastive_loss": 2.484118938446045, - "train/negative_loss": 1.713862419128418, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.7702566385269165, - "train/total_loss": 0.6965425610542297 + "train/classification_loss": 0.16104593873023987, + "train/contrastive_loss": 1.2811723947525024, + "train/negative_loss": 0.9447054862976074, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.336466908454895, + "train/total_loss": 0.4172804355621338 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.11893308907747269, - "train/contrastive_loss": 0.8466957807540894, - "train/negative_loss": 0.3475143611431122, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.49918144941329956, - "train/total_loss": 0.28827226161956787 + "train/classification_loss": 0.1898118257522583, + "train/contrastive_loss": 2.337682008743286, + "train/negative_loss": 2.3365840911865234, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.001097861211746931, + "train/total_loss": 0.6573482751846313 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.22388330101966858, - "train/contrastive_loss": 3.114335060119629, - "train/negative_loss": 1.9729821681976318, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.141352891921997, - "train/total_loss": 0.8467503786087036 + "train/classification_loss": 0.21859918534755707, + "train/contrastive_loss": 3.874910831451416, + "train/negative_loss": 2.375621795654297, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.4992889165878296, + "train/total_loss": 0.9935813546180725 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.13905051350593567, - "train/contrastive_loss": 2.0086660385131836, - "train/negative_loss": 2.002528429031372, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.006137543357908726, - "train/total_loss": 0.5407837629318237 + "train/classification_loss": 0.19474028050899506, + "train/contrastive_loss": 1.2165257930755615, + "train/negative_loss": 0.9295287132263184, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.28699710965156555, + "train/total_loss": 0.4380454421043396 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.14148475229740143, - "train/contrastive_loss": 2.0354971885681152, - "train/negative_loss": 1.280540943145752, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.7549561858177185, - "train/total_loss": 0.5485842227935791 + "train/classification_loss": 0.13938456773757935, + "train/contrastive_loss": 1.7123061418533325, + "train/negative_loss": 0.773226261138916, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.9390798807144165, + "train/total_loss": 0.48184579610824585 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.15636850893497467, - "train/contrastive_loss": 0.5206571817398071, - "train/negative_loss": 0.4728316366672516, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.04782555252313614, - "train/total_loss": 0.2604999542236328 + "train/classification_loss": 0.17868198454380035, + "train/contrastive_loss": 1.6806676387786865, + "train/negative_loss": 0.8136024475097656, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.8670651912689209, + "train/total_loss": 0.5148155093193054 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.23993158340454102, - "train/contrastive_loss": 2.7363338470458984, - "train/negative_loss": 1.7949838638305664, - "train/num_negatives": 40, + "train/classification_loss": 0.13712361454963684, + "train/contrastive_loss": 1.727832317352295, + "train/negative_loss": 0.965118944644928, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.9413498640060425, - "train/total_loss": 0.7871983647346497 + "train/positive_loss": 0.7627133727073669, + "train/total_loss": 0.48269009590148926 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.1826252043247223, - "train/contrastive_loss": 0.8108238577842712, - "train/negative_loss": 0.34674638509750366, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.4640774726867676, - "train/total_loss": 0.344789981842041 + "train/classification_loss": 0.20445416867733002, + "train/contrastive_loss": 1.7956867218017578, + "train/negative_loss": 1.5415583848953247, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.2541283071041107, + "train/total_loss": 0.5635915398597717 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.1975785791873932, - "train/contrastive_loss": 1.1125320196151733, - "train/negative_loss": 1.1086567640304565, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.0038752290420234203, - "train/total_loss": 0.42008498311042786 + "train/classification_loss": 0.17574962973594666, + "train/contrastive_loss": 0.7344685196876526, + "train/negative_loss": 0.7213791012763977, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.013089398853480816, + "train/total_loss": 0.32264333963394165 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.16182057559490204, - "train/contrastive_loss": 2.69752836227417, - "train/negative_loss": 1.3694905042648315, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.3280378580093384, - "train/total_loss": 0.7013262510299683 + "train/classification_loss": 0.1970960795879364, + "train/contrastive_loss": 3.4482498168945312, + "train/negative_loss": 1.6692242622375488, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.7790255546569824, + "train/total_loss": 0.8867460489273071 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.25060588121414185, - "train/contrastive_loss": 1.809828758239746, - "train/negative_loss": 0.627274215221405, - "train/num_negatives": 44, + "train/classification_loss": 0.15910790860652924, + "train/contrastive_loss": 2.4080164432525635, + "train/negative_loss": 2.366711139678955, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.1825544834136963, - "train/total_loss": 0.6125715970993042 + "train/positive_loss": 0.04130534082651138, + "train/total_loss": 0.6407111883163452 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.26068177819252014, - "train/contrastive_loss": 2.2497401237487793, - "train/negative_loss": 1.7352186441421509, - "train/num_negatives": 44, + "train/classification_loss": 0.1344788819551468, + "train/contrastive_loss": 2.969633102416992, + "train/negative_loss": 2.035134792327881, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.5145214796066284, - "train/total_loss": 0.7106298208236694 + "train/positive_loss": 0.9344983100891113, + "train/total_loss": 0.7284054756164551 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.14321886003017426, - "train/contrastive_loss": 1.933957576751709, - "train/negative_loss": 0.6470386385917664, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 1.2869188785552979, - "train/total_loss": 0.5300104022026062 + "train/classification_loss": 0.18802078068256378, + "train/contrastive_loss": 3.068547487258911, + "train/negative_loss": 2.0661990642547607, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 1.0023484230041504, + "train/total_loss": 0.8017302751541138 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.13916918635368347, - "train/contrastive_loss": 0.38205021619796753, - "train/negative_loss": 0.14382590353488922, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.23822429776191711, - "train/total_loss": 0.21557924151420593 + "train/classification_loss": 0.2385285645723343, + "train/contrastive_loss": 3.411303758621216, + "train/negative_loss": 1.678453803062439, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.7328499555587769, + "train/total_loss": 0.9207893013954163 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.11141932755708694, - "train/contrastive_loss": 0.6793302893638611, - "train/negative_loss": 0.3044567406177521, + "train/classification_loss": 0.17487332224845886, + "train/contrastive_loss": 1.6150904893875122, + "train/negative_loss": 0.6004703044891357, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.374873548746109, - "train/total_loss": 0.247285395860672 + "train/num_positives": 10, + "train/positive_loss": 1.0146201848983765, + "train/total_loss": 0.4978914260864258 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.26875388622283936, - "train/contrastive_loss": 1.575418472290039, - "train/negative_loss": 0.17127986252307892, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.4041385650634766, - "train/total_loss": 0.583837628364563 + "train/classification_loss": 0.2230340838432312, + "train/contrastive_loss": 3.04897141456604, + "train/negative_loss": 2.6776747703552246, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.37129664421081543, + "train/total_loss": 0.8328284025192261 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.2528129518032074, - "train/contrastive_loss": 3.153428554534912, - "train/negative_loss": 1.6320233345031738, + "train/classification_loss": 0.20771414041519165, + "train/contrastive_loss": 1.9516738653182983, + "train/negative_loss": 1.9042127132415771, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.5214052200317383, - "train/total_loss": 0.8834986686706543 + "train/num_positives": 4, + "train/positive_loss": 0.0474611259996891, + "train/total_loss": 0.5980489253997803 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.19132502377033234, - "train/contrastive_loss": 2.3682749271392822, - "train/negative_loss": 1.9646615982055664, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.40361326932907104, - "train/total_loss": 0.6649799942970276 + "train/classification_loss": 0.19842027127742767, + "train/contrastive_loss": 0.6385742425918579, + "train/negative_loss": 0.5296170711517334, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.10895716398954391, + "train/total_loss": 0.32613512873649597 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.2008475959300995, - "train/contrastive_loss": 1.2457764148712158, - "train/negative_loss": 0.6553623676300049, - "train/num_negatives": 40, + "train/classification_loss": 0.2546830475330353, + "train/contrastive_loss": 3.3375473022460938, + "train/negative_loss": 1.7217724323272705, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.5904139876365662, - "train/total_loss": 0.45000287890434265 - }, - { - "epoch": 7.224334600760456, - "step": 1900, - "train/classification_loss": 0.2201923429965973, - "train/contrastive_loss": 1.7136672735214233, - "train/negative_loss": 1.4705090522766113, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.2431582510471344, - "train/total_loss": 0.5629258155822754 - }, - { - "epoch": 7.224334600760456, - "step": 1900, - "train/classification_loss": 0.1529267132282257, - "train/contrastive_loss": 0.6145889163017273, - "train/negative_loss": 0.24079373478889465, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.37379518151283264, - "train/total_loss": 0.2758445143699646 + "train/positive_loss": 1.6157747507095337, + "train/total_loss": 0.9221925735473633 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.2378939688205719, - "train/contrastive_loss": 3.438408374786377, - "train/negative_loss": 1.9361172914505005, + "train/classification_loss": 0.22745093703269958, + "train/contrastive_loss": 1.483272910118103, + "train/negative_loss": 1.4721198081970215, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.502290964126587, - "train/total_loss": 0.9255756139755249 + "train/num_positives": 10, + "train/positive_loss": 0.011153125204145908, + "train/total_loss": 0.5241055488586426 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.2722857892513275, - "train/contrastive_loss": 1.1518443822860718, - "train/negative_loss": 1.1510798931121826, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0007645429577678442, - "train/total_loss": 0.5026546716690063 + "train/classification_loss": 0.1658446192741394, + "train/contrastive_loss": 1.7293444871902466, + "train/negative_loss": 1.7292804718017578, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 6.39890058664605e-05, + "train/total_loss": 0.5117135047912598 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.210185244679451, - "train/contrastive_loss": 2.0761258602142334, - "train/negative_loss": 1.0823867321014404, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.993739128112793, - "train/total_loss": 0.6254104375839233 + "train/classification_loss": 0.1772678792476654, + "train/contrastive_loss": 2.528303861618042, + "train/negative_loss": 1.8653534650802612, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.662950336933136, + "train/total_loss": 0.6829286813735962 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.2001577764749527, - "train/contrastive_loss": 2.517183303833008, - "train/negative_loss": 1.9847521781921387, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.5324310064315796, - "train/total_loss": 0.703594446182251 + "train/classification_loss": 0.19365540146827698, + "train/contrastive_loss": 1.9069876670837402, + "train/negative_loss": 1.4431899785995483, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.4637976586818695, + "train/total_loss": 0.5750529766082764 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.17754627764225006, - "train/contrastive_loss": 3.99332857131958, - "train/negative_loss": 1.4673980474472046, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 2.525930643081665, - "train/total_loss": 0.9762119650840759 + "train/classification_loss": 0.21822020411491394, + "train/contrastive_loss": 2.259861469268799, + "train/negative_loss": 1.7424304485321045, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.5174309611320496, + "train/total_loss": 0.6701924800872803 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.1642834097146988, - "train/contrastive_loss": 1.0820200443267822, - "train/negative_loss": 0.6744377017021179, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.4075823128223419, - "train/total_loss": 0.380687415599823 + "train/classification_loss": 0.2339928299188614, + "train/contrastive_loss": 1.7953006029129028, + "train/negative_loss": 1.2796703577041626, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.5156302452087402, + "train/total_loss": 0.5930529832839966 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.1880195289850235, - "train/contrastive_loss": 1.0751765966415405, - "train/negative_loss": 1.0159794092178345, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.059197232127189636, - "train/total_loss": 0.4030548334121704 + "train/classification_loss": 0.14385662972927094, + "train/contrastive_loss": 1.7576894760131836, + "train/negative_loss": 1.757625937461853, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 6.35528631391935e-05, + "train/total_loss": 0.4953945279121399 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.20186151564121246, - "train/contrastive_loss": 1.4653698205947876, - "train/negative_loss": 1.3361455202102661, + "train/classification_loss": 0.21224145591259003, + "train/contrastive_loss": 0.9677494168281555, + "train/negative_loss": 0.7769870162010193, "train/num_negatives": 46, "train/num_positives": 8, - "train/positive_loss": 0.12922434508800507, - "train/total_loss": 0.4949355125427246 + "train/positive_loss": 0.19076238572597504, + "train/total_loss": 0.40579134225845337 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.20118412375450134, - "train/contrastive_loss": 1.845171332359314, - "train/negative_loss": 1.805213451385498, + "train/classification_loss": 0.26073524355888367, + "train/contrastive_loss": 2.4725046157836914, + "train/negative_loss": 1.906913161277771, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.56559157371521, + "train/total_loss": 0.7552361488342285 + }, + { + "epoch": 6.690140845070422, + "step": 1900, + "train/classification_loss": 0.20143432915210724, + "train/contrastive_loss": 0.35213300585746765, + "train/negative_loss": 0.32196640968322754, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.030166584998369217, + "train/total_loss": 0.27186092734336853 + }, + { + "epoch": 6.690140845070422, + "step": 1900, + "train/classification_loss": 0.2922963500022888, + "train/contrastive_loss": 3.730564832687378, + "train/negative_loss": 2.024803876876831, + "train/num_negatives": 42, + "train/num_positives": 8, + "train/positive_loss": 1.7057609558105469, + "train/total_loss": 1.0384093523025513 + }, + { + "epoch": 6.690140845070422, + "step": 1900, + "train/classification_loss": 0.14334173500537872, + "train/contrastive_loss": 1.0197844505310059, + "train/negative_loss": 0.7755264639854431, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.03995787352323532, - "train/total_loss": 0.5702183842658997 + "train/num_positives": 10, + "train/positive_loss": 0.24425797164440155, + "train/total_loss": 0.34729862213134766 + }, + { + "epoch": 6.690140845070422, + "step": 1900, + "train/classification_loss": 0.16851532459259033, + "train/contrastive_loss": 1.9482519626617432, + "train/negative_loss": 1.5255510807037354, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.4227008521556854, + "train/total_loss": 0.5581657290458679 + }, + { + "epoch": 6.690140845070422, + "step": 1900, + "train/classification_loss": 0.1941116750240326, + "train/contrastive_loss": 1.0349037647247314, + "train/negative_loss": 1.0348531007766724, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 5.060583498561755e-05, + "train/total_loss": 0.40109241008758545 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.17741942405700684, - "train/contrastive_loss": 1.0716540813446045, - "train/negative_loss": 0.9175702929496765, + "train/classification_loss": 0.251036137342453, + "train/contrastive_loss": 1.2935383319854736, + "train/negative_loss": 1.2841545343399048, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.15408380329608917, - "train/total_loss": 0.3917502462863922 + "train/positive_loss": 0.009383788332343102, + "train/total_loss": 0.5097438097000122 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.20031604170799255, - "train/contrastive_loss": 2.827211856842041, - "train/negative_loss": 2.2385547161102295, - "train/num_negatives": 36, + "train/classification_loss": 0.19396381080150604, + "train/contrastive_loss": 1.0589491128921509, + "train/negative_loss": 1.0146514177322388, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.044297702610492706, + "train/total_loss": 0.40575364232063293 + }, + { + "epoch": 6.690140845070422, + "step": 1900, + "train/classification_loss": 0.3197799026966095, + "train/contrastive_loss": 2.846153736114502, + "train/negative_loss": 1.9570695161819458, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.5886572003364563, - "train/total_loss": 0.7657583951950073 + "train/positive_loss": 0.8890842795372009, + "train/total_loss": 0.8890106678009033 + }, + { + "epoch": 6.690140845070422, + "step": 1900, + "train/classification_loss": 0.17094211280345917, + "train/contrastive_loss": 1.5236997604370117, + "train/negative_loss": 1.1987823247909546, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.32491737604141235, + "train/total_loss": 0.4756820797920227 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.22783654928207397, - "train/contrastive_loss": 0.7710169553756714, - "train/negative_loss": 0.37993574142456055, + "train/classification_loss": 0.19952167570590973, + "train/contrastive_loss": 2.54634952545166, + "train/negative_loss": 2.0986878871917725, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.39108118414878845, - "train/total_loss": 0.38203996419906616 + "train/num_positives": 14, + "train/positive_loss": 0.44766175746917725, + "train/total_loss": 0.7087915539741516 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.16931910812854767, - "train/contrastive_loss": 2.2249300479888916, - "train/negative_loss": 1.3033899068832397, + "train/classification_loss": 0.2637220621109009, + "train/contrastive_loss": 3.4194865226745605, + "train/negative_loss": 3.419389247894287, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.9215401411056519, - "train/total_loss": 0.6143051385879517 + "train/num_positives": 2, + "train/positive_loss": 9.716029308037832e-05, + "train/total_loss": 0.9476193785667419 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.14516431093215942, - "train/contrastive_loss": 1.6941709518432617, - "train/negative_loss": 0.9295675158500671, + "train/classification_loss": 0.18567171692848206, + "train/contrastive_loss": 1.8019644021987915, + "train/negative_loss": 0.8965386748313904, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.7646033763885498, - "train/total_loss": 0.48399850726127625 + "train/num_positives": 16, + "train/positive_loss": 0.9054257273674011, + "train/total_loss": 0.5460646152496338 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.2947947084903717, - "train/contrastive_loss": 1.736924171447754, - "train/negative_loss": 1.3492668867111206, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.3876572549343109, - "train/total_loss": 0.642179548740387 + "train/classification_loss": 0.14846765995025635, + "train/contrastive_loss": 0.3383611738681793, + "train/negative_loss": 0.2893919348716736, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.04896923899650574, + "train/total_loss": 0.21613989770412445 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.113642118871212, - "train/contrastive_loss": 0.21493473649024963, - "train/negative_loss": 0.21489816904067993, - "train/num_negatives": 48, + "train/classification_loss": 0.2143513411283493, + "train/contrastive_loss": 0.8977898359298706, + "train/negative_loss": 0.7769964337348938, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 3.6568904761224985e-05, - "train/total_loss": 0.1566290706396103 + "train/positive_loss": 0.1207934021949768, + "train/total_loss": 0.3939093053340912 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.16848988831043243, - "train/contrastive_loss": 0.8080705404281616, - "train/negative_loss": 0.3000565469264984, + "train/classification_loss": 0.20978379249572754, + "train/contrastive_loss": 0.9033424854278564, + "train/negative_loss": 0.879086971282959, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.5080139636993408, - "train/total_loss": 0.3301039934158325 + "train/num_positives": 14, + "train/positive_loss": 0.024255530908703804, + "train/total_loss": 0.3904522955417633 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.1185910552740097, - "train/contrastive_loss": 0.584959089756012, - "train/negative_loss": 0.5501630306243896, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.03479604050517082, - "train/total_loss": 0.2355828732252121 + "train/classification_loss": 0.2949010133743286, + "train/contrastive_loss": 2.775782585144043, + "train/negative_loss": 1.5411112308502197, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 1.2346712350845337, + "train/total_loss": 0.8500575423240662 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.2083611935377121, - "train/contrastive_loss": 0.7933493256568909, - "train/negative_loss": 0.740670919418335, - "train/num_negatives": 28, + "train/classification_loss": 0.1392522156238556, + "train/contrastive_loss": 0.5150004625320435, + "train/negative_loss": 0.3977017104625702, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.05267840623855591, - "train/total_loss": 0.367031067609787 + "train/positive_loss": 0.11729878187179565, + "train/total_loss": 0.24225232005119324 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.16460934281349182, - "train/contrastive_loss": 1.7578182220458984, - "train/negative_loss": 0.7742782235145569, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.9835400581359863, - "train/total_loss": 0.5161730051040649 + "train/classification_loss": 0.1353110373020172, + "train/contrastive_loss": 0.6411240100860596, + "train/negative_loss": 0.3942115008831024, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.24691250920295715, + "train/total_loss": 0.26353585720062256 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.15848402678966522, - "train/contrastive_loss": 0.3644297122955322, - "train/negative_loss": 0.36417528986930847, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.00025440845638513565, - "train/total_loss": 0.2313699722290039 + "train/classification_loss": 0.16366037726402283, + "train/contrastive_loss": 0.9654884338378906, + "train/negative_loss": 0.8125596046447754, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.15292885899543762, + "train/total_loss": 0.3567580580711365 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.20275916159152985, - "train/contrastive_loss": 2.957404851913452, - "train/negative_loss": 1.3066281080245972, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.650776743888855, - "train/total_loss": 0.7942401170730591 + "train/classification_loss": 0.21263548731803894, + "train/contrastive_loss": 3.341897964477539, + "train/negative_loss": 1.6389883756637573, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.7029095888137817, + "train/total_loss": 0.8810150623321533 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.22495000064373016, - "train/contrastive_loss": 2.602616786956787, - "train/negative_loss": 1.8647745847702026, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.7378420829772949, - "train/total_loss": 0.7454733848571777 + "train/classification_loss": 0.20965367555618286, + "train/contrastive_loss": 1.287813425064087, + "train/negative_loss": 0.9864407777786255, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.3013727068901062, + "train/total_loss": 0.4672163724899292 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.19474181532859802, - "train/contrastive_loss": 1.4715299606323242, - "train/negative_loss": 0.5788039565086365, + "train/classification_loss": 0.12619730830192566, + "train/contrastive_loss": 0.20683008432388306, + "train/negative_loss": 0.18669262528419495, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.8927260637283325, - "train/total_loss": 0.4890478253364563 + "train/num_positives": 16, + "train/positive_loss": 0.020137455314397812, + "train/total_loss": 0.1675633192062378 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.15915730595588684, - "train/contrastive_loss": 2.7397236824035645, - "train/negative_loss": 1.4792815446853638, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.2604420185089111, - "train/total_loss": 0.7071020603179932 + "train/classification_loss": 0.1951521784067154, + "train/contrastive_loss": 2.7269630432128906, + "train/negative_loss": 1.184470772743225, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 1.5424922704696655, + "train/total_loss": 0.7405447959899902 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.24516554176807404, - "train/contrastive_loss": 4.227482795715332, - "train/negative_loss": 1.431012511253357, + "train/classification_loss": 0.27544525265693665, + "train/contrastive_loss": 2.3511710166931152, + "train/negative_loss": 1.8781392574310303, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 2.7964701652526855, - "train/total_loss": 1.0906621217727661 + "train/num_positives": 2, + "train/positive_loss": 0.47303175926208496, + "train/total_loss": 0.745679497718811 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.216152161359787, - "train/contrastive_loss": 2.927096366882324, - "train/negative_loss": 1.6010522842407227, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.326043963432312, - "train/total_loss": 0.8015714883804321 + "train/classification_loss": 0.13615156710147858, + "train/contrastive_loss": 2.0564262866973877, + "train/negative_loss": 1.1554896831512451, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.9009365439414978, + "train/total_loss": 0.5474368333816528 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.1812569946050644, - "train/contrastive_loss": 2.3428733348846436, - "train/negative_loss": 1.4339426755905151, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.9089307188987732, - "train/total_loss": 0.6498316526412964 + "train/classification_loss": 0.19944772124290466, + "train/contrastive_loss": 1.4613717794418335, + "train/negative_loss": 0.9308468103408813, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.5305249691009521, + "train/total_loss": 0.49172207713127136 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.20488488674163818, - "train/contrastive_loss": 2.9946796894073486, - "train/negative_loss": 1.6998493671417236, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.294830322265625, - "train/total_loss": 0.8038208484649658 + "train/classification_loss": 0.19426573812961578, + "train/contrastive_loss": 0.9899672269821167, + "train/negative_loss": 0.6158229112625122, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 0.3741443455219269, + "train/total_loss": 0.3922591805458069 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.2248542755842209, - "train/contrastive_loss": 3.059823989868164, - "train/negative_loss": 1.9666022062301636, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.093221664428711, - "train/total_loss": 0.8368191123008728 + "train/classification_loss": 0.19476650655269623, + "train/contrastive_loss": 4.197413921356201, + "train/negative_loss": 4.197410583496094, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 3.564370445019449e-06, + "train/total_loss": 1.0342493057250977 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.24216416478157043, - "train/contrastive_loss": 2.35111141204834, - "train/negative_loss": 1.4901659488677979, + "train/classification_loss": 0.18569374084472656, + "train/contrastive_loss": 0.9398561716079712, + "train/negative_loss": 0.44885239005088806, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.8609453439712524, - "train/total_loss": 0.7123864889144897 + "train/positive_loss": 0.4910038113594055, + "train/total_loss": 0.3736649751663208 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.1817237287759781, - "train/contrastive_loss": 0.6771752238273621, - "train/negative_loss": 0.6745142340660095, + "train/classification_loss": 0.21243086457252502, + "train/contrastive_loss": 1.806515097618103, + "train/negative_loss": 1.6013031005859375, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.0026609888300299644, - "train/total_loss": 0.3171587586402893 + "train/num_positives": 8, + "train/positive_loss": 0.20521198213100433, + "train/total_loss": 0.573733925819397 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.17729176580905914, - "train/contrastive_loss": 1.5463391542434692, - "train/negative_loss": 0.6096402406692505, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.9366989135742188, - "train/total_loss": 0.4865596294403076 + "train/classification_loss": 0.1697894185781479, + "train/contrastive_loss": 2.1891608238220215, + "train/negative_loss": 1.155372142791748, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.0337885618209839, + "train/total_loss": 0.6076216101646423 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.1682153046131134, - "train/contrastive_loss": 1.3778948783874512, - "train/negative_loss": 0.48077836632728577, - "train/num_negatives": 46, + "train/classification_loss": 0.26295313239097595, + "train/contrastive_loss": 2.4246573448181152, + "train/negative_loss": 2.173088312149048, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.8971165418624878, - "train/total_loss": 0.44379428029060364 + "train/positive_loss": 0.25156909227371216, + "train/total_loss": 0.7478846311569214 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.2370443493127823, - "train/contrastive_loss": 1.6158963441848755, - "train/negative_loss": 1.6158963441848755, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5602236390113831 - }, - { - "epoch": 7.224334600760456, - "eval_exact_match_accuracy": 0.22666666666666666, - "eval_hamming_loss": 0.07204481792717086, - "eval_loss": 0.5601001977920532, - "eval_macro_f1": 0.21023296002791764, - "eval_macro_precision": 0.5093390822144054, - "eval_macro_recall": 0.15440273376574337, - "eval_micro_f1": 0.47338247338247336, - "eval_micro_precision": 0.8450292397660819, - "eval_micro_recall": 0.32878270762229805, - "eval_runtime": 2.6241, - "eval_samples_per_second": 200.067, - "eval_steps_per_second": 25.151, + "train/classification_loss": 0.2108353227376938, + "train/contrastive_loss": 2.371546506881714, + "train/negative_loss": 1.8840951919555664, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.48745131492614746, + "train/total_loss": 0.6851446032524109 + }, + { + "epoch": 6.690140845070422, + "eval_exact_match_accuracy": 0.23985890652557318, + "eval_hamming_loss": 0.07199917003838573, + "eval_loss": 0.5858319997787476, + "eval_macro_f1": 0.23369980164035162, + "eval_macro_precision": 0.3577172514594292, + "eval_macro_recall": 0.18727694783923346, + "eval_micro_f1": 0.4766214177978884, + "eval_micro_precision": 0.8144329896907216, + "eval_micro_recall": 0.3368869936034115, + "eval_runtime": 2.8614, + "eval_samples_per_second": 198.153, + "eval_steps_per_second": 24.813, "step": 1900 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.14963044226169586, - "train/contrastive_loss": 0.8808765411376953, - "train/negative_loss": 0.4277215301990509, - "train/num_negatives": 30, - "train/num_positives": 26, - "train/positive_loss": 0.4531550109386444, - "train/total_loss": 0.32580575346946716 + "train/classification_loss": 0.1914425790309906, + "train/contrastive_loss": 0.9861552715301514, + "train/negative_loss": 0.7161850333213806, + "train/num_negatives": 34, + "train/num_positives": 8, + "train/positive_loss": 0.26997020840644836, + "train/total_loss": 0.3886736333370209 }, { - "epoch": 7.224334600760456, + "epoch": 6.690140845070422, "step": 1900, - "train/classification_loss": 0.21229328215122223, - "train/contrastive_loss": 0.7890034317970276, - "train/negative_loss": 0.7614498138427734, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.027553638443350792, - "train/total_loss": 0.37009397149086 + "train/classification_loss": 0.1036413162946701, + "train/contrastive_loss": 0.8758577108383179, + "train/negative_loss": 0.7414747476577759, + "train/num_negatives": 14, + "train/num_positives": 42, + "train/positive_loss": 0.13438299298286438, + "train/total_loss": 0.27881285548210144 }, { - "epoch": 7.414448669201521, - "grad_norm": 13.29869270324707, - "learning_rate": 1.971887366818874e-05, - "loss": 0.7761, + "epoch": 6.866197183098592, + "grad_norm": 12.582423210144043, + "learning_rate": 1.9739816772374912e-05, + "loss": 0.8348, "step": 1950 }, { - "epoch": 7.414448669201521, + "epoch": 6.866197183098592, "step": 1950, - "train/classification_loss": 0.16173161566257477, - "train/contrastive_loss": 0.7327642440795898, - "train/negative_loss": 0.6514501571655273, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.0813140869140625, - "train/total_loss": 0.3082844614982605 + "train/classification_loss": 0.16489115357398987, + "train/contrastive_loss": 1.159151315689087, + "train/negative_loss": 0.5638828277587891, + "train/num_negatives": 44, + "train/num_positives": 10, + "train/positive_loss": 0.5952684283256531, + "train/total_loss": 0.39672142267227173 }, { - "epoch": 7.414448669201521, + "epoch": 6.866197183098592, "step": 1950, - "train/classification_loss": 0.1634564995765686, - "train/contrastive_loss": 1.0687999725341797, - "train/negative_loss": 0.7888278365135193, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.2799721360206604, - "train/total_loss": 0.37721651792526245 + "train/classification_loss": 0.1773223578929901, + "train/contrastive_loss": 1.3071624040603638, + "train/negative_loss": 0.7744905352592468, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.5326718688011169, + "train/total_loss": 0.4387548565864563 }, { - "epoch": 7.604562737642586, - "grad_norm": 10.397614479064941, - "learning_rate": 1.9711263318112633e-05, - "loss": 0.7541, + "epoch": 7.042253521126761, + "grad_norm": 20.763103485107422, + "learning_rate": 1.973276955602537e-05, + "loss": 0.812, "step": 2000 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.25760364532470703, - "train/contrastive_loss": 1.5996177196502686, - "train/negative_loss": 0.5334265828132629, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.0661911964416504, - "train/total_loss": 0.5775271654129028 + "train/classification_loss": 0.2362351417541504, + "train/contrastive_loss": 1.8519260883331299, + "train/negative_loss": 1.4278429746627808, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.42408308386802673, + "train/total_loss": 0.6066203713417053 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.21227966248989105, - "train/contrastive_loss": 1.4870281219482422, - "train/negative_loss": 1.0446085929870605, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.44241952896118164, - "train/total_loss": 0.5096852779388428 + "train/classification_loss": 0.24857378005981445, + "train/contrastive_loss": 1.9192769527435303, + "train/negative_loss": 0.5345038771629333, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 1.3847731351852417, + "train/total_loss": 0.6324291825294495 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.16029950976371765, - "train/contrastive_loss": 1.9429798126220703, - "train/negative_loss": 0.6662464737892151, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.2767333984375, - "train/total_loss": 0.5488954782485962 + "train/classification_loss": 0.2557935118675232, + "train/contrastive_loss": 2.0504822731018066, + "train/negative_loss": 1.2515318393707275, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.7989503741264343, + "train/total_loss": 0.6658899784088135 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.18443091213703156, - "train/contrastive_loss": 2.7816567420959473, - "train/negative_loss": 1.6894618272781372, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.0921950340270996, - "train/total_loss": 0.7407622337341309 + "train/classification_loss": 0.13967962563037872, + "train/contrastive_loss": 1.2220646142959595, + "train/negative_loss": 0.49229907989501953, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.7297655344009399, + "train/total_loss": 0.3840925693511963 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.14715616405010223, - "train/contrastive_loss": 1.7735682725906372, - "train/negative_loss": 1.702828049659729, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.0707402229309082, - "train/total_loss": 0.501869797706604 + "train/classification_loss": 0.21881839632987976, + "train/contrastive_loss": 2.4377989768981934, + "train/negative_loss": 2.1648924350738525, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.272906631231308, + "train/total_loss": 0.7063782215118408 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.17605924606323242, - "train/contrastive_loss": 1.9468157291412354, - "train/negative_loss": 1.5541973114013672, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.39261841773986816, - "train/total_loss": 0.5654224157333374 + "train/classification_loss": 0.20519232749938965, + "train/contrastive_loss": 2.113013744354248, + "train/negative_loss": 1.5762704610824585, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.5367433428764343, + "train/total_loss": 0.6277951002120972 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.22183391451835632, - "train/contrastive_loss": 1.3343843221664429, - "train/negative_loss": 1.1058834791183472, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.22850081324577332, - "train/total_loss": 0.48871079087257385 + "train/classification_loss": 0.2447187751531601, + "train/contrastive_loss": 2.3133597373962402, + "train/negative_loss": 1.4129846096038818, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.9003751277923584, + "train/total_loss": 0.7073907256126404 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.16443677246570587, - "train/contrastive_loss": 1.9178416728973389, - "train/negative_loss": 1.3420844078063965, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.5757573246955872, - "train/total_loss": 0.5480051040649414 + "train/classification_loss": 0.20461270213127136, + "train/contrastive_loss": 1.3597595691680908, + "train/negative_loss": 1.3584171533584595, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 0.0013423627242445946, + "train/total_loss": 0.4765646159648895 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.15371112525463104, - "train/contrastive_loss": 1.0821201801300049, - "train/negative_loss": 1.0433807373046875, + "train/classification_loss": 0.11606776714324951, + "train/contrastive_loss": 0.7776416540145874, + "train/negative_loss": 0.17869257926940918, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.038739386945962906, - "train/total_loss": 0.3701351583003998 + "train/positive_loss": 0.5989490747451782, + "train/total_loss": 0.27159610390663147 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.3127135634422302, - "train/contrastive_loss": 3.349125385284424, - "train/negative_loss": 1.7698719501495361, + "train/classification_loss": 0.20091688632965088, + "train/contrastive_loss": 1.4774000644683838, + "train/negative_loss": 0.8960364460945129, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.5792533159255981, - "train/total_loss": 0.982538640499115 + "train/num_positives": 14, + "train/positive_loss": 0.5813636183738708, + "train/total_loss": 0.49639689922332764 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.2044217884540558, - "train/contrastive_loss": 2.3104734420776367, - "train/negative_loss": 1.6196720600128174, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.6908013224601746, - "train/total_loss": 0.6665164828300476 + "train/classification_loss": 0.1626138538122177, + "train/contrastive_loss": 2.7368881702423096, + "train/negative_loss": 0.7150574326515198, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 2.0218307971954346, + "train/total_loss": 0.7099915146827698 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.12838655710220337, - "train/contrastive_loss": 1.3005011081695557, - "train/negative_loss": 0.6207240223884583, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.6797771453857422, - "train/total_loss": 0.38848677277565 + "train/classification_loss": 0.18105195462703705, + "train/contrastive_loss": 1.9752154350280762, + "train/negative_loss": 0.9806166887283325, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.9945988059043884, + "train/total_loss": 0.5760950446128845 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.22150970995426178, - "train/contrastive_loss": 2.4545466899871826, - "train/negative_loss": 2.1371853351593018, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.3173612952232361, - "train/total_loss": 0.7124190330505371 + "train/classification_loss": 0.21323104202747345, + "train/contrastive_loss": 4.088104248046875, + "train/negative_loss": 2.310882091522217, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.7772222757339478, + "train/total_loss": 1.03085196018219 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.14342333376407623, - "train/contrastive_loss": 2.603027582168579, - "train/negative_loss": 2.5929176807403564, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.010109840892255306, - "train/total_loss": 0.6640288233757019 + "train/classification_loss": 0.20089012384414673, + "train/contrastive_loss": 0.9459574222564697, + "train/negative_loss": 0.9221904873847961, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.023766906931996346, + "train/total_loss": 0.39008161425590515 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.13493017852306366, - "train/contrastive_loss": 1.8221955299377441, - "train/negative_loss": 1.6820231676101685, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.14017239212989807, - "train/total_loss": 0.4993692636489868 + "train/classification_loss": 0.1529805064201355, + "train/contrastive_loss": 2.7501914501190186, + "train/negative_loss": 0.7597729563713074, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.9904184341430664, + "train/total_loss": 0.7030187845230103 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.1518411636352539, - "train/contrastive_loss": 0.5060108304023743, - "train/negative_loss": 0.4964960217475891, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.00951483566313982, - "train/total_loss": 0.2530433237552643 + "train/classification_loss": 0.1842104196548462, + "train/contrastive_loss": 1.3468527793884277, + "train/negative_loss": 0.7031615376472473, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.6436912417411804, + "train/total_loss": 0.45358097553253174 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.23082436621189117, - "train/contrastive_loss": 2.0391952991485596, - "train/negative_loss": 1.3553224802017212, - "train/num_negatives": 40, + "train/classification_loss": 0.15590372681617737, + "train/contrastive_loss": 1.2907254695892334, + "train/negative_loss": 0.5921145677566528, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.6838728785514832, - "train/total_loss": 0.6386634111404419 + "train/positive_loss": 0.6986109018325806, + "train/total_loss": 0.41404882073402405 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.16953381896018982, - "train/contrastive_loss": 0.6273353695869446, - "train/negative_loss": 0.2779753804206848, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.34935998916625977, - "train/total_loss": 0.29500091075897217 + "train/classification_loss": 0.21427588164806366, + "train/contrastive_loss": 2.122995376586914, + "train/negative_loss": 1.0316722393035889, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 1.0913230180740356, + "train/total_loss": 0.6388749480247498 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.19932444393634796, - "train/contrastive_loss": 1.2405918836593628, - "train/negative_loss": 1.2400827407836914, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.0005091738421469927, - "train/total_loss": 0.44744282960891724 + "train/classification_loss": 0.17009508609771729, + "train/contrastive_loss": 2.3069941997528076, + "train/negative_loss": 0.44117772579193115, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 1.8658164739608765, + "train/total_loss": 0.6314939260482788 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.16035506129264832, - "train/contrastive_loss": 2.5977165699005127, - "train/negative_loss": 2.063074827194214, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.534641683101654, - "train/total_loss": 0.6798983812332153 + "train/classification_loss": 0.19829769432544708, + "train/contrastive_loss": 3.1649794578552246, + "train/negative_loss": 1.2711479663848877, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.893831491470337, + "train/total_loss": 0.8312935829162598 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.24354861676692963, - "train/contrastive_loss": 1.9360108375549316, - "train/negative_loss": 0.6013937592506409, - "train/num_negatives": 44, + "train/classification_loss": 0.15294112265110016, + "train/contrastive_loss": 1.5679103136062622, + "train/negative_loss": 1.4811872243881226, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.334617018699646, - "train/total_loss": 0.6307507753372192 + "train/positive_loss": 0.08672310411930084, + "train/total_loss": 0.4665231704711914 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.265688419342041, - "train/contrastive_loss": 2.2388620376586914, - "train/negative_loss": 1.6326713562011719, - "train/num_negatives": 44, + "train/classification_loss": 0.1360597163438797, + "train/contrastive_loss": 2.8801255226135254, + "train/negative_loss": 1.8268636465072632, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.60619056224823, - "train/total_loss": 0.7134608030319214 + "train/positive_loss": 1.0532619953155518, + "train/total_loss": 0.7120848298072815 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.14194628596305847, - "train/contrastive_loss": 1.3342111110687256, - "train/negative_loss": 0.3991124629974365, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.9350985884666443, - "train/total_loss": 0.4087885022163391 + "train/classification_loss": 0.17827272415161133, + "train/contrastive_loss": 1.3183475732803345, + "train/negative_loss": 1.082555890083313, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.23579168319702148, + "train/total_loss": 0.4419422447681427 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.1379009634256363, - "train/contrastive_loss": 0.38181203603744507, - "train/negative_loss": 0.1820473074913025, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.19976471364498138, - "train/total_loss": 0.21426337957382202 + "train/classification_loss": 0.23059043288230896, + "train/contrastive_loss": 2.581986427307129, + "train/negative_loss": 1.0841857194900513, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.4978007078170776, + "train/total_loss": 0.7469877004623413 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.11187899857759476, - "train/contrastive_loss": 1.019776463508606, - "train/negative_loss": 0.9016225934028625, + "train/classification_loss": 0.1846114695072174, + "train/contrastive_loss": 2.9019343852996826, + "train/negative_loss": 0.7159580588340759, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.11815386265516281, - "train/total_loss": 0.31583428382873535 + "train/num_positives": 10, + "train/positive_loss": 2.185976266860962, + "train/total_loss": 0.7649983167648315 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.2533835768699646, - "train/contrastive_loss": 1.0039386749267578, - "train/negative_loss": 0.1792580485343933, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 0.8246806859970093, - "train/total_loss": 0.4541712999343872 + "train/classification_loss": 0.2163945436477661, + "train/contrastive_loss": 2.67317795753479, + "train/negative_loss": 2.2118775844573975, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.46130040287971497, + "train/total_loss": 0.7510301470756531 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.26547789573669434, - "train/contrastive_loss": 2.5931267738342285, - "train/negative_loss": 1.40211820602417, + "train/classification_loss": 0.18990576267242432, + "train/contrastive_loss": 1.328331470489502, + "train/negative_loss": 1.2516578435897827, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.1910085678100586, - "train/total_loss": 0.784103274345398 + "train/num_positives": 4, + "train/positive_loss": 0.07667367160320282, + "train/total_loss": 0.45557206869125366 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.18228618800640106, - "train/contrastive_loss": 2.0619115829467773, - "train/negative_loss": 1.976146936416626, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.08576452732086182, - "train/total_loss": 0.5946685075759888 + "train/classification_loss": 0.19577154517173767, + "train/contrastive_loss": 0.4446567893028259, + "train/negative_loss": 0.31728339195251465, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.12737338244915009, + "train/total_loss": 0.2847028970718384 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.20130515098571777, - "train/contrastive_loss": 0.9039791822433472, - "train/negative_loss": 0.7096244692802429, - "train/num_negatives": 40, + "train/classification_loss": 0.2638605833053589, + "train/contrastive_loss": 3.8089709281921387, + "train/negative_loss": 1.8787500858306885, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.19435469806194305, - "train/total_loss": 0.38210099935531616 - }, - { - "epoch": 7.604562737642586, - "step": 2000, - "train/classification_loss": 0.2225930243730545, - "train/contrastive_loss": 1.843961477279663, - "train/negative_loss": 1.6039674282073975, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.2399941086769104, - "train/total_loss": 0.5913853049278259 - }, - { - "epoch": 7.604562737642586, - "step": 2000, - "train/classification_loss": 0.1393265426158905, - "train/contrastive_loss": 1.2521319389343262, - "train/negative_loss": 0.7101022005081177, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.5420296788215637, - "train/total_loss": 0.38975292444229126 + "train/positive_loss": 1.9302209615707397, + "train/total_loss": 1.0256547927856445 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.23149627447128296, - "train/contrastive_loss": 2.1842167377471924, - "train/negative_loss": 1.5735644102096558, + "train/classification_loss": 0.19399510324001312, + "train/contrastive_loss": 0.2953444719314575, + "train/negative_loss": 0.29346784949302673, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.6106523275375366, - "train/total_loss": 0.6683396100997925 - }, - { - "epoch": 7.604562737642586, - "step": 2000, - "train/classification_loss": 0.24577267467975616, - "train/contrastive_loss": 1.0090378522872925, - "train/negative_loss": 1.0054996013641357, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0035383044742047787, - "train/total_loss": 0.4475802481174469 + "train/num_positives": 10, + "train/positive_loss": 0.0018766270950436592, + "train/total_loss": 0.25306400656700134 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.20942839980125427, - "train/contrastive_loss": 1.6994205713272095, - "train/negative_loss": 1.1729934215545654, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.526427149772644, - "train/total_loss": 0.5493125319480896 + "train/classification_loss": 0.16145648062229156, + "train/contrastive_loss": 0.8155556321144104, + "train/negative_loss": 0.8145245313644409, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.0010311153018847108, + "train/total_loss": 0.32456761598587036 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.20390035212039948, - "train/contrastive_loss": 3.3355281352996826, - "train/negative_loss": 2.5678646564483643, + "train/classification_loss": 0.18451470136642456, + "train/contrastive_loss": 3.1608457565307617, + "train/negative_loss": 1.346009612083435, "train/num_negatives": 52, "train/num_positives": 4, - "train/positive_loss": 0.7676634788513184, - "train/total_loss": 0.8710059523582458 + "train/positive_loss": 1.8148361444473267, + "train/total_loss": 0.8166838884353638 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.18830916285514832, - "train/contrastive_loss": 3.8336565494537354, - "train/negative_loss": 2.1246612071990967, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.7089953422546387, - "train/total_loss": 0.955040454864502 + "train/classification_loss": 0.19750577211380005, + "train/contrastive_loss": 2.7886009216308594, + "train/negative_loss": 1.5062581300735474, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.2823426723480225, + "train/total_loss": 0.7552259564399719 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.1574951559305191, - "train/contrastive_loss": 1.0574684143066406, - "train/negative_loss": 0.9506610035896301, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.10680736601352692, - "train/total_loss": 0.36898884177207947 + "train/classification_loss": 0.2239988148212433, + "train/contrastive_loss": 1.6791869401931763, + "train/negative_loss": 1.523707389831543, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.1554795205593109, + "train/total_loss": 0.559836208820343 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.1921737790107727, - "train/contrastive_loss": 1.3146706819534302, - "train/negative_loss": 1.1052671670913696, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.20940352976322174, - "train/total_loss": 0.4551079273223877 + "train/classification_loss": 0.23329736292362213, + "train/contrastive_loss": 1.4122387170791626, + "train/negative_loss": 1.0055705308914185, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.40666818618774414, + "train/total_loss": 0.5157451033592224 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.20184588432312012, - "train/contrastive_loss": 1.5963292121887207, - "train/negative_loss": 1.5774725675582886, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.018856603652238846, - "train/total_loss": 0.5211117267608643 + "train/classification_loss": 0.1416924148797989, + "train/contrastive_loss": 1.7027676105499268, + "train/negative_loss": 1.6979366540908813, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.004831010941416025, + "train/total_loss": 0.48224592208862305 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.19180163741111755, - "train/contrastive_loss": 2.143568515777588, - "train/negative_loss": 2.075841188430786, + "train/classification_loss": 0.19002702832221985, + "train/contrastive_loss": 1.052809476852417, + "train/negative_loss": 0.48256024718284607, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.06772740930318832, - "train/total_loss": 0.6205153465270996 + "train/num_positives": 8, + "train/positive_loss": 0.5702492594718933, + "train/total_loss": 0.4005889296531677 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.16881020367145538, - "train/contrastive_loss": 0.795946478843689, - "train/negative_loss": 0.7678190469741821, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.02812742441892624, - "train/total_loss": 0.3279995024204254 + "train/classification_loss": 0.24436832964420319, + "train/contrastive_loss": 2.652658224105835, + "train/negative_loss": 2.5322282314300537, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.12043005228042603, + "train/total_loss": 0.774899959564209 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.20318828523159027, - "train/contrastive_loss": 3.122394323348999, - "train/negative_loss": 2.6416938304901123, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.4807005524635315, - "train/total_loss": 0.8276671767234802 + "train/classification_loss": 0.2173294723033905, + "train/contrastive_loss": 1.050851583480835, + "train/negative_loss": 0.41586580872535706, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.6349857449531555, + "train/total_loss": 0.42749977111816406 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.21516050398349762, - "train/contrastive_loss": 1.3100075721740723, - "train/negative_loss": 0.5911017060279846, + "train/classification_loss": 0.2557370960712433, + "train/contrastive_loss": 3.507844924926758, + "train/negative_loss": 1.7896414995193481, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.7189058065414429, - "train/total_loss": 0.4771620035171509 + "train/num_positives": 8, + "train/positive_loss": 1.7182034254074097, + "train/total_loss": 0.9573061466217041 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.16688789427280426, - "train/contrastive_loss": 2.337801933288574, - "train/negative_loss": 0.9640027284622192, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.3737993240356445, - "train/total_loss": 0.6344482898712158 + "train/classification_loss": 0.15647295117378235, + "train/contrastive_loss": 1.9243996143341064, + "train/negative_loss": 0.8473648428916931, + "train/num_negatives": 46, + "train/num_positives": 10, + "train/positive_loss": 1.077034831047058, + "train/total_loss": 0.5413528680801392 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.138629749417305, - "train/contrastive_loss": 1.5183663368225098, - "train/negative_loss": 0.6795521974563599, - "train/num_negatives": 40, + "train/classification_loss": 0.19858531653881073, + "train/contrastive_loss": 3.264824628829956, + "train/negative_loss": 1.9236528873443604, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.8388140797615051, - "train/total_loss": 0.44230300188064575 + "train/positive_loss": 1.3411717414855957, + "train/total_loss": 0.851550281047821 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.2969335615634918, - "train/contrastive_loss": 3.1722028255462646, - "train/negative_loss": 1.2512099742889404, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 1.9209928512573242, - "train/total_loss": 0.931374192237854 + "train/classification_loss": 0.18637149035930634, + "train/contrastive_loss": 0.8652422428131104, + "train/negative_loss": 0.8648046851158142, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.00043756456580013037, + "train/total_loss": 0.35941994190216064 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.11085063219070435, - "train/contrastive_loss": 0.40473005175590515, - "train/negative_loss": 0.40472668409347534, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 3.3676692510198336e-06, - "train/total_loss": 0.19179664552211761 + "train/classification_loss": 0.23737040162086487, + "train/contrastive_loss": 1.315877914428711, + "train/negative_loss": 1.2596700191497803, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.05620790645480156, + "train/total_loss": 0.5005459785461426 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.15130729973316193, - "train/contrastive_loss": 0.6556370854377747, - "train/negative_loss": 0.22013774514198303, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.4354993402957916, - "train/total_loss": 0.28243470191955566 + "train/classification_loss": 0.17482119798660278, + "train/contrastive_loss": 0.5855051279067993, + "train/negative_loss": 0.49711862206459045, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.08838652074337006, + "train/total_loss": 0.2919222116470337 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.11103592813014984, - "train/contrastive_loss": 0.7518661022186279, - "train/negative_loss": 0.7333263158798218, + "train/classification_loss": 0.3261856138706207, + "train/contrastive_loss": 3.35722017288208, + "train/negative_loss": 2.8081116676330566, "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.018539762124419212, - "train/total_loss": 0.2614091634750366 + "train/num_positives": 18, + "train/positive_loss": 0.5491083860397339, + "train/total_loss": 0.9976296424865723 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.19888342916965485, - "train/contrastive_loss": 0.7062749862670898, - "train/negative_loss": 0.586571991443634, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.11970296502113342, - "train/total_loss": 0.34013843536376953 + "train/classification_loss": 0.1665060967206955, + "train/contrastive_loss": 2.3770527839660645, + "train/negative_loss": 1.1813523769378662, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.1957004070281982, + "train/total_loss": 0.6419166326522827 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.15981309115886688, - "train/contrastive_loss": 1.4523539543151855, - "train/negative_loss": 0.9135475158691406, + "train/classification_loss": 0.19585020840168, + "train/contrastive_loss": 2.3128790855407715, + "train/negative_loss": 1.997403860092163, "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.5388064384460449, - "train/total_loss": 0.45028388500213623 + "train/positive_loss": 0.3154752850532532, + "train/total_loss": 0.65842604637146 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.15552787482738495, - "train/contrastive_loss": 0.497802734375, - "train/negative_loss": 0.4977577030658722, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 4.502255978877656e-05, - "train/total_loss": 0.2550884187221527 + "train/classification_loss": 0.26863744854927063, + "train/contrastive_loss": 1.9115461111068726, + "train/negative_loss": 1.9073971509933472, + "train/num_negatives": 48, + "train/num_positives": 2, + "train/positive_loss": 0.004148912150412798, + "train/total_loss": 0.6509466767311096 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.19367560744285583, - "train/contrastive_loss": 2.0883357524871826, - "train/negative_loss": 0.800537645816803, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.2877981662750244, - "train/total_loss": 0.6113427877426147 + "train/classification_loss": 0.20195668935775757, + "train/contrastive_loss": 2.6705875396728516, + "train/negative_loss": 1.3570350408554077, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 1.3135526180267334, + "train/total_loss": 0.7360742092132568 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.2277127504348755, - "train/contrastive_loss": 2.5091609954833984, - "train/negative_loss": 1.7388274669647217, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.7703334093093872, - "train/total_loss": 0.7295449376106262 + "train/classification_loss": 0.14928652346134186, + "train/contrastive_loss": 0.4415435791015625, + "train/negative_loss": 0.1442383974790573, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.2973051965236664, + "train/total_loss": 0.23759523034095764 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.18810832500457764, - "train/contrastive_loss": 1.5860930681228638, - "train/negative_loss": 0.7384803891181946, + "train/classification_loss": 0.21754610538482666, + "train/contrastive_loss": 0.9183329939842224, + "train/negative_loss": 0.8456249237060547, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.8476126790046692, - "train/total_loss": 0.5053269863128662 + "train/num_positives": 8, + "train/positive_loss": 0.07270805537700653, + "train/total_loss": 0.4012126922607422 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.17881536483764648, - "train/contrastive_loss": 2.7698986530303955, - "train/negative_loss": 2.15185546875, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.6180431842803955, - "train/total_loss": 0.7327951192855835 + "train/classification_loss": 0.2064519226551056, + "train/contrastive_loss": 1.0396910905838013, + "train/negative_loss": 0.7583673596382141, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.28132373094558716, + "train/total_loss": 0.4143901467323303 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.24741697311401367, - "train/contrastive_loss": 2.630859851837158, - "train/negative_loss": 1.460553765296936, - "train/num_negatives": 46, + "train/classification_loss": 0.3096502721309662, + "train/contrastive_loss": 3.450502872467041, + "train/negative_loss": 1.6730321645736694, + "train/num_negatives": 36, "train/num_positives": 6, - "train/positive_loss": 1.1703060865402222, - "train/total_loss": 0.7735889554023743 + "train/positive_loss": 1.777470588684082, + "train/total_loss": 0.9997508525848389 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.20398138463497162, - "train/contrastive_loss": 3.0517756938934326, - "train/negative_loss": 2.01479172706604, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.0369839668273926, - "train/total_loss": 0.8143365383148193 + "train/classification_loss": 0.14425420761108398, + "train/contrastive_loss": 1.5759310722351074, + "train/negative_loss": 0.5687820315361023, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.00714910030365, + "train/total_loss": 0.4594404399394989 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.1790669709444046, - "train/contrastive_loss": 2.675906181335449, - "train/negative_loss": 2.5105106830596924, + "train/classification_loss": 0.15498444437980652, + "train/contrastive_loss": 0.9943720698356628, + "train/negative_loss": 0.39699310064315796, "train/num_negatives": 34, "train/num_positives": 22, - "train/positive_loss": 0.16539549827575684, - "train/total_loss": 0.7142481803894043 + "train/positive_loss": 0.5973789691925049, + "train/total_loss": 0.3538588583469391 + }, + { + "epoch": 7.042253521126761, + "step": 2000, + "train/classification_loss": 0.1753116250038147, + "train/contrastive_loss": 1.2349880933761597, + "train/negative_loss": 0.8611277937889099, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.37386029958724976, + "train/total_loss": 0.4223092496395111 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.23147188127040863, - "train/contrastive_loss": 3.284961700439453, - "train/negative_loss": 2.433438777923584, + "train/classification_loss": 0.20669427514076233, + "train/contrastive_loss": 2.516334056854248, + "train/negative_loss": 1.600029468536377, "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.9163047075271606, + "train/total_loss": 0.7099610567092896 + }, + { + "epoch": 7.042253521126761, + "step": 2000, + "train/classification_loss": 0.2280310094356537, + "train/contrastive_loss": 1.7300918102264404, + "train/negative_loss": 0.9287343621253967, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.8013574481010437, + "train/total_loss": 0.5740493535995483 + }, + { + "epoch": 7.042253521126761, + "step": 2000, + "train/classification_loss": 0.1291375607252121, + "train/contrastive_loss": 0.3905165195465088, + "train/negative_loss": 0.36405906081199646, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.026457473635673523, + "train/total_loss": 0.20724086463451385 + }, + { + "epoch": 7.042253521126761, + "step": 2000, + "train/classification_loss": 0.18336929380893707, + "train/contrastive_loss": 2.472332000732422, + "train/negative_loss": 0.8201510310173035, + "train/num_negatives": 40, "train/num_positives": 10, - "train/positive_loss": 0.8515230417251587, - "train/total_loss": 0.8884642720222473 + "train/positive_loss": 1.6521809101104736, + "train/total_loss": 0.6778357028961182 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.21087293326854706, - "train/contrastive_loss": 3.6380438804626465, - "train/negative_loss": 2.7292826175689697, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.9087611436843872, - "train/total_loss": 0.9384817481040955 + "train/classification_loss": 0.26893728971481323, + "train/contrastive_loss": 2.540144205093384, + "train/negative_loss": 2.33729887008667, + "train/num_negatives": 46, + "train/num_positives": 2, + "train/positive_loss": 0.20284537971019745, + "train/total_loss": 0.7769661545753479 + }, + { + "epoch": 7.042253521126761, + "step": 2000, + "train/classification_loss": 0.15116026997566223, + "train/contrastive_loss": 3.666731357574463, + "train/negative_loss": 1.3440535068511963, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 2.3226778507232666, + "train/total_loss": 0.8845065832138062 + }, + { + "epoch": 7.042253521126761, + "step": 2000, + "train/classification_loss": 0.19742503762245178, + "train/contrastive_loss": 1.1862914562225342, + "train/negative_loss": 0.8539636731147766, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.3323277235031128, + "train/total_loss": 0.43468332290649414 + }, + { + "epoch": 7.042253521126761, + "step": 2000, + "train/classification_loss": 0.19969873130321503, + "train/contrastive_loss": 2.613133668899536, + "train/negative_loss": 0.7444072365760803, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 1.868726372718811, + "train/total_loss": 0.7223255038261414 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.2523042559623718, - "train/contrastive_loss": 3.360802173614502, - "train/negative_loss": 1.6016154289245605, + "train/classification_loss": 0.1827583760023117, + "train/contrastive_loss": 2.811319589614868, + "train/negative_loss": 2.811307430267334, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 1.224303832714213e-05, + "train/total_loss": 0.7450222969055176 + }, + { + "epoch": 7.042253521126761, + "step": 2000, + "train/classification_loss": 0.18829362094402313, + "train/contrastive_loss": 1.503467082977295, + "train/negative_loss": 0.5310150980949402, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.7591866254806519, - "train/total_loss": 0.9244647026062012 + "train/positive_loss": 0.9724519848823547, + "train/total_loss": 0.4889870285987854 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.1853431761264801, - "train/contrastive_loss": 0.7267683744430542, - "train/negative_loss": 0.7010278105735779, + "train/classification_loss": 0.2116677165031433, + "train/contrastive_loss": 1.8518648147583008, + "train/negative_loss": 1.1245393753051758, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.02574053965508938, - "train/total_loss": 0.33069685101509094 + "train/num_positives": 8, + "train/positive_loss": 0.727325439453125, + "train/total_loss": 0.5820406675338745 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.16749586164951324, - "train/contrastive_loss": 1.6338083744049072, - "train/negative_loss": 1.236406683921814, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.39740175008773804, - "train/total_loss": 0.4942575693130493 + "train/classification_loss": 0.18907849490642548, + "train/contrastive_loss": 3.509683132171631, + "train/negative_loss": 1.1446689367294312, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 2.36501407623291, + "train/total_loss": 0.8910151720046997 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.159888356924057, - "train/contrastive_loss": 2.096015214920044, - "train/negative_loss": 0.7528360486030579, - "train/num_negatives": 46, + "train/classification_loss": 0.2407016158103943, + "train/contrastive_loss": 2.019270896911621, + "train/negative_loss": 1.208043098449707, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 1.3431791067123413, - "train/total_loss": 0.5790914297103882 + "train/positive_loss": 0.8112277984619141, + "train/total_loss": 0.6445558071136475 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.24716559052467346, - "train/contrastive_loss": 1.4255017042160034, - "train/negative_loss": 1.4255017042160034, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5322659015655518 - }, - { - "epoch": 7.604562737642586, - "eval_exact_match_accuracy": 0.2723809523809524, - "eval_hamming_loss": 0.0695798319327731, - "eval_loss": 0.5608550906181335, - "eval_macro_f1": 0.2395544890951816, - "eval_macro_precision": 0.4592908911385675, - "eval_macro_recall": 0.18243077867984092, - "eval_micro_f1": 0.5152224824355972, - "eval_micro_precision": 0.8208955223880597, - "eval_micro_recall": 0.37542662116040953, - "eval_runtime": 2.6316, - "eval_samples_per_second": 199.497, - "eval_steps_per_second": 25.08, + "train/classification_loss": 0.18559277057647705, + "train/contrastive_loss": 0.8697998523712158, + "train/negative_loss": 0.5192899703979492, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.350509911775589, + "train/total_loss": 0.3595527410507202 + }, + { + "epoch": 7.042253521126761, + "eval_exact_match_accuracy": 0.24338624338624337, + "eval_hamming_loss": 0.07148044402946364, + "eval_loss": 0.5932103991508484, + "eval_macro_f1": 0.2869839196785755, + "eval_macro_precision": 0.5377193414857824, + "eval_macro_recall": 0.22395556754608176, + "eval_micro_f1": 0.4768413059984814, + "eval_micro_precision": 0.8284960422163589, + "eval_micro_recall": 0.3347547974413646, + "eval_runtime": 2.8406, + "eval_samples_per_second": 199.609, + "eval_steps_per_second": 24.995, "step": 2000 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.15970121324062347, - "train/contrastive_loss": 1.0793523788452148, - "train/negative_loss": 1.0791679620742798, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.00018446551985107362, - "train/total_loss": 0.37557169795036316 + "train/classification_loss": 0.19512946903705597, + "train/contrastive_loss": 1.394766926765442, + "train/negative_loss": 1.1764943599700928, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.2182726114988327, + "train/total_loss": 0.474082887172699 }, { - "epoch": 7.604562737642586, + "epoch": 7.042253521126761, "step": 2000, - "train/classification_loss": 0.22743454575538635, - "train/contrastive_loss": 1.9560699462890625, - "train/negative_loss": 1.9476550817489624, - "train/num_negatives": 38, - "train/num_positives": 10, - "train/positive_loss": 0.008414804935455322, - "train/total_loss": 0.6186485290527344 + "train/classification_loss": 0.14290325343608856, + "train/contrastive_loss": 0.8412747979164124, + "train/negative_loss": 0.8009767532348633, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.040298063308000565, + "train/total_loss": 0.3111582100391388 }, { - "epoch": 7.79467680608365, - "grad_norm": 16.926349639892578, - "learning_rate": 1.970365296803653e-05, - "loss": 0.7864, + "epoch": 7.21830985915493, + "grad_norm": 9.392231941223145, + "learning_rate": 1.972572233967583e-05, + "loss": 0.7174, "step": 2050 }, { - "epoch": 7.79467680608365, + "epoch": 7.21830985915493, "step": 2050, - "train/classification_loss": 0.20321263372898102, - "train/contrastive_loss": 2.187316417694092, - "train/negative_loss": 1.3580164909362793, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.8292998671531677, - "train/total_loss": 0.6406759023666382 + "train/classification_loss": 0.20707447826862335, + "train/contrastive_loss": 0.46742427349090576, + "train/negative_loss": 0.37921902537345886, + "train/num_negatives": 40, + "train/num_positives": 8, + "train/positive_loss": 0.0882052481174469, + "train/total_loss": 0.3005593419075012 }, { - "epoch": 7.79467680608365, + "epoch": 7.21830985915493, "step": 2050, - "train/classification_loss": 0.18674755096435547, - "train/contrastive_loss": 1.3275718688964844, - "train/negative_loss": 0.6868754625320435, - "train/num_negatives": 40, - "train/num_positives": 8, - "train/positive_loss": 0.6406964063644409, - "train/total_loss": 0.45226192474365234 + "train/classification_loss": 0.16357415914535522, + "train/contrastive_loss": 0.7880473732948303, + "train/negative_loss": 0.43332773447036743, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.3547196388244629, + "train/total_loss": 0.32118362188339233 }, { - "epoch": 7.984790874524715, - "grad_norm": 13.207832336425781, - "learning_rate": 1.9696042617960426e-05, - "loss": 0.781, + "epoch": 7.394366197183099, + "grad_norm": 13.048248291015625, + "learning_rate": 1.9718675123326286e-05, + "loss": 0.7735, "step": 2100 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.2406453788280487, - "train/contrastive_loss": 2.4808759689331055, - "train/negative_loss": 0.8370329737663269, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.6438430547714233, - "train/total_loss": 0.7368205785751343 + "train/classification_loss": 0.2355850785970688, + "train/contrastive_loss": 1.9243850708007812, + "train/negative_loss": 1.3720566034317017, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.5523284673690796, + "train/total_loss": 0.6204621195793152 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.20677006244659424, - "train/contrastive_loss": 1.382346272468567, - "train/negative_loss": 1.1022403240203857, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.28010591864585876, - "train/total_loss": 0.4832393229007721 + "train/classification_loss": 0.2805800139904022, + "train/contrastive_loss": 2.2836239337921143, + "train/negative_loss": 0.8140482902526855, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 1.4695756435394287, + "train/total_loss": 0.7373048067092896 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.15407142043113708, - "train/contrastive_loss": 2.3497872352600098, - "train/negative_loss": 0.6794371604919434, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.670350193977356, - "train/total_loss": 0.6240288615226746 + "train/classification_loss": 0.2488636076450348, + "train/contrastive_loss": 2.5649256706237793, + "train/negative_loss": 1.4715982675552368, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.0933274030685425, + "train/total_loss": 0.7618488073348999 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.18043629825115204, - "train/contrastive_loss": 2.17608904838562, - "train/negative_loss": 1.449393630027771, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.7266954779624939, - "train/total_loss": 0.6156541109085083 + "train/classification_loss": 0.13060618937015533, + "train/contrastive_loss": 0.8548005819320679, + "train/negative_loss": 0.8200228810310364, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.03477772697806358, + "train/total_loss": 0.30156630277633667 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.14387649297714233, - "train/contrastive_loss": 1.5560455322265625, - "train/negative_loss": 1.0251407623291016, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.5309047698974609, - "train/total_loss": 0.4550856053829193 + "train/classification_loss": 0.2158774733543396, + "train/contrastive_loss": 2.6734330654144287, + "train/negative_loss": 2.255758047103882, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.41767510771751404, + "train/total_loss": 0.7505640983581543 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.1918298751115799, - "train/contrastive_loss": 2.3336539268493652, - "train/negative_loss": 1.5252022743225098, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.808451771736145, - "train/total_loss": 0.6585606932640076 + "train/classification_loss": 0.2009315937757492, + "train/contrastive_loss": 2.5592880249023438, + "train/negative_loss": 1.6822422742843628, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.8770458698272705, + "train/total_loss": 0.7127892374992371 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.22570137679576874, - "train/contrastive_loss": 1.8155590295791626, - "train/negative_loss": 1.1220539808273315, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.693505048751831, - "train/total_loss": 0.5888131856918335 + "train/classification_loss": 0.1938031017780304, + "train/contrastive_loss": 1.9480438232421875, + "train/negative_loss": 1.1423985958099365, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.805645227432251, + "train/total_loss": 0.5834118723869324 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.16947361826896667, - "train/contrastive_loss": 1.9469965696334839, - "train/negative_loss": 1.7367358207702637, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.2102607637643814, - "train/total_loss": 0.5588729381561279 + "train/classification_loss": 0.21119935810565948, + "train/contrastive_loss": 1.7656980752944946, + "train/negative_loss": 1.7656002044677734, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 9.787561430130154e-05, + "train/total_loss": 0.5643389821052551 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.1483248472213745, - "train/contrastive_loss": 1.3436309099197388, - "train/negative_loss": 1.2688852548599243, + "train/classification_loss": 0.10881562530994415, + "train/contrastive_loss": 0.5218908190727234, + "train/negative_loss": 0.2153853327035904, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.07474564760923386, - "train/total_loss": 0.4170510470867157 + "train/positive_loss": 0.3065054714679718, + "train/total_loss": 0.21319378912448883 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.3079093396663666, - "train/contrastive_loss": 3.029447317123413, - "train/negative_loss": 1.5586564540863037, + "train/classification_loss": 0.21974939107894897, + "train/contrastive_loss": 2.9008002281188965, + "train/negative_loss": 1.8823362588882446, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.4707908630371094, - "train/total_loss": 0.9137988090515137 + "train/num_positives": 14, + "train/positive_loss": 1.0184640884399414, + "train/total_loss": 0.7999094724655151 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.19394029676914215, - "train/contrastive_loss": 2.189574718475342, - "train/negative_loss": 1.5678144693374634, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.6217602491378784, - "train/total_loss": 0.6318552494049072 + "train/classification_loss": 0.15743964910507202, + "train/contrastive_loss": 1.6973141431808472, + "train/negative_loss": 0.9312524199485779, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.7660617232322693, + "train/total_loss": 0.4969024956226349 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.13232888281345367, - "train/contrastive_loss": 1.9863225221633911, - "train/negative_loss": 0.6504867076873779, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 1.3358358144760132, - "train/total_loss": 0.5295934081077576 + "train/classification_loss": 0.18000084161758423, + "train/contrastive_loss": 2.4370360374450684, + "train/negative_loss": 1.3035897016525269, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 1.133446455001831, + "train/total_loss": 0.6674080491065979 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.21595707535743713, - "train/contrastive_loss": 2.910799980163574, - "train/negative_loss": 1.7329236268997192, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.1778762340545654, - "train/total_loss": 0.7981170415878296 + "train/classification_loss": 0.20252205431461334, + "train/contrastive_loss": 4.0921549797058105, + "train/negative_loss": 1.9788979291915894, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 2.1132569313049316, + "train/total_loss": 1.0209530591964722 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.13580238819122314, - "train/contrastive_loss": 2.319345712661743, - "train/negative_loss": 2.3147056102752686, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.004640192724764347, - "train/total_loss": 0.5996715426445007 + "train/classification_loss": 0.1931208223104477, + "train/contrastive_loss": 0.9694631695747375, + "train/negative_loss": 0.7264527082443237, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.24301044642925262, + "train/total_loss": 0.3870134651660919 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.13929709792137146, - "train/contrastive_loss": 1.8290828466415405, - "train/negative_loss": 1.4624388217926025, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.3666440546512604, - "train/total_loss": 0.5051136612892151 + "train/classification_loss": 0.14310020208358765, + "train/contrastive_loss": 3.136925220489502, + "train/negative_loss": 0.9973586797714233, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 2.139566421508789, + "train/total_loss": 0.7704852819442749 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.1469770073890686, - "train/contrastive_loss": 0.5510554313659668, - "train/negative_loss": 0.45692917704582214, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.09412623196840286, - "train/total_loss": 0.257188081741333 + "train/classification_loss": 0.17020396888256073, + "train/contrastive_loss": 0.86734938621521, + "train/negative_loss": 0.6761361956596375, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.19121317565441132, + "train/total_loss": 0.34367385506629944 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.22150512039661407, - "train/contrastive_loss": 2.550544261932373, - "train/negative_loss": 1.8260353803634644, - "train/num_negatives": 40, + "train/classification_loss": 0.12875641882419586, + "train/contrastive_loss": 1.9166319370269775, + "train/negative_loss": 1.196470856666565, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.7245088815689087, - "train/total_loss": 0.7316139936447144 + "train/positive_loss": 0.7201610207557678, + "train/total_loss": 0.5120828151702881 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.16326695680618286, - "train/contrastive_loss": 0.8272742033004761, - "train/negative_loss": 0.4306049942970276, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.3966692388057709, - "train/total_loss": 0.328721821308136 + "train/classification_loss": 0.19211642444133759, + "train/contrastive_loss": 0.7449772357940674, + "train/negative_loss": 0.32287636399269104, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.42210087180137634, + "train/total_loss": 0.3411118686199188 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.18060752749443054, - "train/contrastive_loss": 1.2686816453933716, - "train/negative_loss": 1.263410210609436, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.005271493922919035, - "train/total_loss": 0.4343438744544983 + "train/classification_loss": 0.161703422665596, + "train/contrastive_loss": 0.9431514143943787, + "train/negative_loss": 0.9366201162338257, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.006531290244311094, + "train/total_loss": 0.35033369064331055 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.15130774676799774, - "train/contrastive_loss": 1.199607491493225, - "train/negative_loss": 0.812043309211731, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.38756421208381653, - "train/total_loss": 0.3912292420864105 + "train/classification_loss": 0.19374893605709076, + "train/contrastive_loss": 4.162308692932129, + "train/negative_loss": 1.705967903137207, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 2.4563405513763428, + "train/total_loss": 1.0262106657028198 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.22401319444179535, - "train/contrastive_loss": 1.5085980892181396, - "train/negative_loss": 0.3489173650741577, - "train/num_negatives": 44, + "train/classification_loss": 0.14964060485363007, + "train/contrastive_loss": 1.930443525314331, + "train/negative_loss": 1.869929313659668, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.159680724143982, - "train/total_loss": 0.5257328152656555 + "train/positive_loss": 0.06051427125930786, + "train/total_loss": 0.5357292890548706 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.24623171985149384, - "train/contrastive_loss": 1.2948957681655884, - "train/negative_loss": 1.2658287286758423, - "train/num_negatives": 44, + "train/classification_loss": 0.1389130800962448, + "train/contrastive_loss": 3.3842926025390625, + "train/negative_loss": 2.657822608947754, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.029066983610391617, - "train/total_loss": 0.5052108764648438 + "train/positive_loss": 0.7264699935913086, + "train/total_loss": 0.8157716393470764 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.14000633358955383, - "train/contrastive_loss": 1.2941904067993164, - "train/negative_loss": 0.3640783429145813, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.9301120638847351, - "train/total_loss": 0.3988444209098816 + "train/classification_loss": 0.17792023718357086, + "train/contrastive_loss": 2.513064384460449, + "train/negative_loss": 2.0533604621887207, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.45970404148101807, + "train/total_loss": 0.6805331110954285 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.1363397240638733, - "train/contrastive_loss": 0.32203370332717896, - "train/negative_loss": 0.3148648738861084, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.007168828975409269, - "train/total_loss": 0.20074647665023804 + "train/classification_loss": 0.23604583740234375, + "train/contrastive_loss": 2.593393325805664, + "train/negative_loss": 1.6502387523651123, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.9431546926498413, + "train/total_loss": 0.7547245025634766 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.11134833842515945, - "train/contrastive_loss": 1.1241161823272705, - "train/negative_loss": 0.6101117730140686, + "train/classification_loss": 0.1863241195678711, + "train/contrastive_loss": 2.0253219604492188, + "train/negative_loss": 1.1448673009872437, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.5140044689178467, - "train/total_loss": 0.33617156744003296 + "train/num_positives": 10, + "train/positive_loss": 0.8804546594619751, + "train/total_loss": 0.5913885235786438 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.26296117901802063, - "train/contrastive_loss": 1.0945403575897217, - "train/negative_loss": 0.33508118987083435, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 0.7594591975212097, - "train/total_loss": 0.48186925053596497 + "train/classification_loss": 0.21107758581638336, + "train/contrastive_loss": 2.7217471599578857, + "train/negative_loss": 2.1596999168395996, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.5620473027229309, + "train/total_loss": 0.7554270029067993 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.2652978301048279, - "train/contrastive_loss": 2.9645118713378906, - "train/negative_loss": 1.5412453413009644, + "train/classification_loss": 0.1976681649684906, + "train/contrastive_loss": 1.715854287147522, + "train/negative_loss": 1.7118229866027832, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.4232664108276367, - "train/total_loss": 0.858200192451477 + "train/num_positives": 4, + "train/positive_loss": 0.004031301010400057, + "train/total_loss": 0.5408390164375305 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.17945340275764465, - "train/contrastive_loss": 2.63338565826416, - "train/negative_loss": 2.2780508995056152, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.35533463954925537, - "train/total_loss": 0.7061305046081543 + "train/classification_loss": 0.17681534588336945, + "train/contrastive_loss": 0.14368316531181335, + "train/negative_loss": 0.13802795112133026, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.005655211862176657, + "train/total_loss": 0.20555198192596436 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.19640874862670898, - "train/contrastive_loss": 0.9052658081054688, - "train/negative_loss": 0.506600558757782, - "train/num_negatives": 40, + "train/classification_loss": 0.27567559480667114, + "train/contrastive_loss": 2.819042205810547, + "train/negative_loss": 1.5198527574539185, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.39866527915000916, - "train/total_loss": 0.37746191024780273 + "train/positive_loss": 1.2991894483566284, + "train/total_loss": 0.8394840359687805 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.22491371631622314, - "train/contrastive_loss": 1.6646255254745483, - "train/negative_loss": 1.5333529710769653, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.13127253949642181, - "train/total_loss": 0.5578387975692749 + "train/classification_loss": 0.20924969017505646, + "train/contrastive_loss": 0.3890290856361389, + "train/negative_loss": 0.3867047429084778, + "train/num_negatives": 38, + "train/num_positives": 10, + "train/positive_loss": 0.0023243350442498922, + "train/total_loss": 0.28705549240112305 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.130527526140213, - "train/contrastive_loss": 1.2858607769012451, - "train/negative_loss": 0.7142800092697144, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.5715807676315308, - "train/total_loss": 0.387699693441391 + "train/classification_loss": 0.17166674137115479, + "train/contrastive_loss": 1.5331645011901855, + "train/negative_loss": 1.520494818687439, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.012669644318521023, + "train/total_loss": 0.47829964756965637 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.21956101059913635, - "train/contrastive_loss": 1.7216063737869263, - "train/negative_loss": 0.9733742475509644, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.7482321262359619, - "train/total_loss": 0.5638822913169861 + "train/classification_loss": 0.16858166456222534, + "train/contrastive_loss": 2.918395757675171, + "train/negative_loss": 2.204179048538208, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.7142167091369629, + "train/total_loss": 0.7522608041763306 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.2498248964548111, - "train/contrastive_loss": 1.0058456659317017, - "train/negative_loss": 1.00518000125885, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.000665707397274673, - "train/total_loss": 0.45099401473999023 + "train/classification_loss": 0.19467951357364655, + "train/contrastive_loss": 1.0604459047317505, + "train/negative_loss": 0.48637786507606506, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.5740680694580078, + "train/total_loss": 0.40676867961883545 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.2064022421836853, - "train/contrastive_loss": 1.871691107749939, - "train/negative_loss": 1.2635945081710815, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.6080965995788574, - "train/total_loss": 0.5807404518127441 + "train/classification_loss": 0.21877193450927734, + "train/contrastive_loss": 2.194817304611206, + "train/negative_loss": 1.7197083234786987, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.47510895133018494, + "train/total_loss": 0.6577354073524475 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.1901632696390152, - "train/contrastive_loss": 3.894577980041504, - "train/negative_loss": 2.4027152061462402, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.4918626546859741, - "train/total_loss": 0.9690788388252258 + "train/classification_loss": 0.23548386991024017, + "train/contrastive_loss": 1.9063204526901245, + "train/negative_loss": 1.3938144445419312, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.5125060081481934, + "train/total_loss": 0.6167479753494263 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.17786064743995667, - "train/contrastive_loss": 4.095897197723389, - "train/negative_loss": 1.4728835821151733, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 2.623013496398926, - "train/total_loss": 0.9970401525497437 + "train/classification_loss": 0.15225757658481598, + "train/contrastive_loss": 2.207214832305908, + "train/negative_loss": 2.2071568965911865, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 5.7984703744295985e-05, + "train/total_loss": 0.5937005281448364 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.15590515732765198, - "train/contrastive_loss": 1.267581582069397, - "train/negative_loss": 0.842531144618988, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.42505043745040894, - "train/total_loss": 0.40942147374153137 + "train/classification_loss": 0.19602622091770172, + "train/contrastive_loss": 0.8796312212944031, + "train/negative_loss": 0.6032993793487549, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 0.2763318419456482, + "train/total_loss": 0.37195247411727905 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.19465456902980804, - "train/contrastive_loss": 1.687809705734253, - "train/negative_loss": 1.0547823905944824, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.6330272555351257, - "train/total_loss": 0.532216489315033 + "train/classification_loss": 0.24723008275032043, + "train/contrastive_loss": 2.630075454711914, + "train/negative_loss": 2.3886241912841797, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.24145132303237915, + "train/total_loss": 0.7732452154159546 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.21194936335086823, - "train/contrastive_loss": 2.2923460006713867, - "train/negative_loss": 2.0208756923675537, - "train/num_negatives": 46, + "train/classification_loss": 0.2137121856212616, + "train/contrastive_loss": 0.9918572902679443, + "train/negative_loss": 0.474529892206192, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.5173274278640747, + "train/total_loss": 0.41208362579345703 + }, + { + "epoch": 7.394366197183099, + "step": 2100, + "train/classification_loss": 0.2880937159061432, + "train/contrastive_loss": 3.541677236557007, + "train/negative_loss": 1.4077179431915283, + "train/num_negatives": 42, "train/num_positives": 8, - "train/positive_loss": 0.27147042751312256, - "train/total_loss": 0.6704185605049133 + "train/positive_loss": 2.1339592933654785, + "train/total_loss": 0.9964292049407959 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.18587909638881683, - "train/contrastive_loss": 2.0996501445770264, - "train/negative_loss": 2.079890489578247, + "train/classification_loss": 0.14877694845199585, + "train/contrastive_loss": 1.132318139076233, + "train/negative_loss": 0.7275153398513794, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.019759582355618477, - "train/total_loss": 0.6058091521263123 + "train/num_positives": 10, + "train/positive_loss": 0.4048027992248535, + "train/total_loss": 0.3752405643463135 + }, + { + "epoch": 7.394366197183099, + "step": 2100, + "train/classification_loss": 0.18981721997261047, + "train/contrastive_loss": 3.654658555984497, + "train/negative_loss": 2.8217084407806396, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.8329501748085022, + "train/total_loss": 0.9207489490509033 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.16068419814109802, - "train/contrastive_loss": 0.8177267909049988, - "train/negative_loss": 0.8158565163612366, + "train/classification_loss": 0.1946374624967575, + "train/contrastive_loss": 1.383418321609497, + "train/negative_loss": 1.3825664520263672, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.0008519234834238887, + "train/total_loss": 0.47132110595703125 + }, + { + "epoch": 7.394366197183099, + "step": 2100, + "train/classification_loss": 0.2662365436553955, + "train/contrastive_loss": 2.085479259490967, + "train/negative_loss": 1.7236754894256592, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.0018702736124396324, - "train/total_loss": 0.32422953844070435 + "train/positive_loss": 0.3618038594722748, + "train/total_loss": 0.6833324432373047 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.19491207599639893, - "train/contrastive_loss": 2.8049683570861816, - "train/negative_loss": 2.203845262527466, - "train/num_negatives": 36, + "train/classification_loss": 0.18046359717845917, + "train/contrastive_loss": 0.5860280990600586, + "train/negative_loss": 0.5711997151374817, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.014828408136963844, + "train/total_loss": 0.2976692318916321 + }, + { + "epoch": 7.394366197183099, + "step": 2100, + "train/classification_loss": 0.31441617012023926, + "train/contrastive_loss": 1.8963901996612549, + "train/negative_loss": 1.2531230449676514, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.6011231541633606, - "train/total_loss": 0.7559057474136353 + "train/positive_loss": 0.6432670950889587, + "train/total_loss": 0.6936942338943481 + }, + { + "epoch": 7.394366197183099, + "step": 2100, + "train/classification_loss": 0.16098926961421967, + "train/contrastive_loss": 2.4503560066223145, + "train/negative_loss": 1.1020476818084717, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.3483083248138428, + "train/total_loss": 0.6510604619979858 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.22287388145923615, - "train/contrastive_loss": 1.3788912296295166, - "train/negative_loss": 0.7029107809066772, + "train/classification_loss": 0.19906562566757202, + "train/contrastive_loss": 2.5203075408935547, + "train/negative_loss": 2.0850064754486084, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.6759804487228394, - "train/total_loss": 0.4986521601676941 + "train/num_positives": 14, + "train/positive_loss": 0.43530112504959106, + "train/total_loss": 0.7031271457672119 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.1593582034111023, - "train/contrastive_loss": 1.70096755027771, - "train/negative_loss": 1.4089702367782593, + "train/classification_loss": 0.24975664913654327, + "train/contrastive_loss": 2.529301881790161, + "train/negative_loss": 2.529297113418579, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.2919972538948059, - "train/total_loss": 0.4995517134666443 + "train/num_positives": 2, + "train/positive_loss": 4.64917320641689e-06, + "train/total_loss": 0.7556170225143433 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.14075559377670288, - "train/contrastive_loss": 1.325274109840393, - "train/negative_loss": 0.8002511858940125, + "train/classification_loss": 0.18246497213840485, + "train/contrastive_loss": 2.2353734970092773, + "train/negative_loss": 1.3504908084869385, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.5250229239463806, - "train/total_loss": 0.4058104157447815 + "train/num_positives": 16, + "train/positive_loss": 0.8848828077316284, + "train/total_loss": 0.6295396685600281 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.27061927318573, - "train/contrastive_loss": 1.7263137102127075, - "train/negative_loss": 1.2182928323745728, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.5080208778381348, - "train/total_loss": 0.6158820390701294 + "train/classification_loss": 0.13839206099510193, + "train/contrastive_loss": 0.48033958673477173, + "train/negative_loss": 0.33591514825820923, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.1444244384765625, + "train/total_loss": 0.2344599813222885 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.11641211807727814, - "train/contrastive_loss": 0.47647514939308167, - "train/negative_loss": 0.476345032453537, - "train/num_negatives": 48, + "train/classification_loss": 0.2013828158378601, + "train/contrastive_loss": 0.923154354095459, + "train/negative_loss": 0.8586488962173462, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 0.0001301066658925265, - "train/total_loss": 0.21170714497566223 + "train/positive_loss": 0.064505435526371, + "train/total_loss": 0.3860136866569519 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.14601458609104156, - "train/contrastive_loss": 0.5208742022514343, - "train/negative_loss": 0.19504444301128387, + "train/classification_loss": 0.213034525513649, + "train/contrastive_loss": 0.9196885228157043, + "train/negative_loss": 0.8416456580162048, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.32582977414131165, - "train/total_loss": 0.2501894235610962 + "train/num_positives": 14, + "train/positive_loss": 0.07804284989833832, + "train/total_loss": 0.3969722390174866 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.1139206737279892, - "train/contrastive_loss": 0.8801314234733582, - "train/negative_loss": 0.8688578009605408, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.011273606680333614, - "train/total_loss": 0.289946973323822 + "train/classification_loss": 0.29486164450645447, + "train/contrastive_loss": 1.887904405593872, + "train/negative_loss": 1.2852332592010498, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 0.6026711463928223, + "train/total_loss": 0.6724425554275513 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.19012302160263062, - "train/contrastive_loss": 0.5669975280761719, - "train/negative_loss": 0.39119046926498413, - "train/num_negatives": 28, + "train/classification_loss": 0.1399642378091812, + "train/contrastive_loss": 0.5256852507591248, + "train/negative_loss": 0.4322962462902069, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.17580704391002655, - "train/total_loss": 0.303522527217865 + "train/positive_loss": 0.09338901937007904, + "train/total_loss": 0.24510128796100616 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.15658582746982574, - "train/contrastive_loss": 1.428987741470337, - "train/negative_loss": 0.7394506931304932, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.6895371079444885, - "train/total_loss": 0.44238340854644775 + "train/classification_loss": 0.14409293234348297, + "train/contrastive_loss": 1.1297039985656738, + "train/negative_loss": 0.5489850640296936, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.580718994140625, + "train/total_loss": 0.37003374099731445 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.15400876104831696, - "train/contrastive_loss": 0.3322228193283081, - "train/negative_loss": 0.3320090174674988, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.00021379138343036175, - "train/total_loss": 0.22045332193374634 + "train/classification_loss": 0.1656644195318222, + "train/contrastive_loss": 2.506514310836792, + "train/negative_loss": 0.6568769812583923, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.8496372699737549, + "train/total_loss": 0.6669673323631287 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.2039889544248581, - "train/contrastive_loss": 2.7360458374023438, - "train/negative_loss": 1.134372591972351, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.6016732454299927, - "train/total_loss": 0.7511981725692749 + "train/classification_loss": 0.21137888729572296, + "train/contrastive_loss": 3.516695499420166, + "train/negative_loss": 1.73699951171875, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.7796958684921265, + "train/total_loss": 0.914717972278595 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.23614826798439026, - "train/contrastive_loss": 2.831876277923584, - "train/negative_loss": 2.1523706912994385, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.6795056462287903, - "train/total_loss": 0.8025234937667847 + "train/classification_loss": 0.20528481900691986, + "train/contrastive_loss": 1.4497418403625488, + "train/negative_loss": 0.9157915711402893, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.5339502096176147, + "train/total_loss": 0.4952331781387329 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.17856520414352417, - "train/contrastive_loss": 0.9791860580444336, - "train/negative_loss": 0.4856378734111786, + "train/classification_loss": 0.12146615982055664, + "train/contrastive_loss": 0.2809399366378784, + "train/negative_loss": 0.27169010043144226, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.4935481548309326, - "train/total_loss": 0.37440240383148193 + "train/num_positives": 16, + "train/positive_loss": 0.009249835275113583, + "train/total_loss": 0.17765414714813232 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.17304477095603943, - "train/contrastive_loss": 3.215250253677368, - "train/negative_loss": 1.8366740942001343, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.3785761594772339, - "train/total_loss": 0.8160948753356934 + "train/classification_loss": 0.19084380567073822, + "train/contrastive_loss": 1.9817817211151123, + "train/negative_loss": 1.3369991779327393, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 0.644782543182373, + "train/total_loss": 0.5872001647949219 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.25174760818481445, - "train/contrastive_loss": 2.541818380355835, - "train/negative_loss": 1.3471684455871582, + "train/classification_loss": 0.29518944025039673, + "train/contrastive_loss": 2.743422031402588, + "train/negative_loss": 2.607961416244507, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.1946499347686768, - "train/total_loss": 0.7601112723350525 + "train/num_positives": 2, + "train/positive_loss": 0.13546055555343628, + "train/total_loss": 0.8438738584518433 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.19923652708530426, - "train/contrastive_loss": 2.392577886581421, - "train/negative_loss": 1.5630496740341187, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.829528272151947, - "train/total_loss": 0.6777521371841431 + "train/classification_loss": 0.14376363158226013, + "train/contrastive_loss": 2.569751739501953, + "train/negative_loss": 1.2280256748199463, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.3417261838912964, + "train/total_loss": 0.6577140092849731 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.1922587901353836, - "train/contrastive_loss": 3.3310916423797607, - "train/negative_loss": 2.8737237453460693, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.4573678970336914, - "train/total_loss": 0.8584771156311035 + "train/classification_loss": 0.19214600324630737, + "train/contrastive_loss": 1.444541335105896, + "train/negative_loss": 1.348332166671753, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.09620921313762665, + "train/total_loss": 0.48105427622795105 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.2273131012916565, - "train/contrastive_loss": 3.1888532638549805, - "train/negative_loss": 2.2606723308563232, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.9281808733940125, - "train/total_loss": 0.8650837540626526 + "train/classification_loss": 0.1902756690979004, + "train/contrastive_loss": 2.6923165321350098, + "train/negative_loss": 0.8159744143486023, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 1.8763420581817627, + "train/total_loss": 0.7287389636039734 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.2091589868068695, - "train/contrastive_loss": 2.5276756286621094, - "train/negative_loss": 1.6672519445419312, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.8604235649108887, - "train/total_loss": 0.7146941423416138 + "train/classification_loss": 0.18975751101970673, + "train/contrastive_loss": 4.306968688964844, + "train/negative_loss": 4.306966304779053, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 2.610688852655585e-06, + "train/total_loss": 1.0511512756347656 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.2532994747161865, - "train/contrastive_loss": 2.973903179168701, - "train/negative_loss": 1.5209722518920898, + "train/classification_loss": 0.1805657297372818, + "train/contrastive_loss": 1.6494392156600952, + "train/negative_loss": 0.5808677673339844, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.4529309272766113, - "train/total_loss": 0.8480800986289978 + "train/positive_loss": 1.0685714483261108, + "train/total_loss": 0.5104535818099976 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.18505409359931946, - "train/contrastive_loss": 0.7898645401000977, - "train/negative_loss": 0.7897539138793945, + "train/classification_loss": 0.2143731713294983, + "train/contrastive_loss": 2.3271758556365967, + "train/negative_loss": 1.2828887701034546, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.00011060843826271594, - "train/total_loss": 0.3430269956588745 + "train/num_positives": 8, + "train/positive_loss": 1.044287085533142, + "train/total_loss": 0.6798083782196045 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.15794280171394348, - "train/contrastive_loss": 1.5664119720458984, - "train/negative_loss": 1.212887167930603, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.353524774312973, - "train/total_loss": 0.47122520208358765 + "train/classification_loss": 0.1729976236820221, + "train/contrastive_loss": 3.203278064727783, + "train/negative_loss": 1.3971877098083496, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.806090235710144, + "train/total_loss": 0.8136532306671143 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.15526723861694336, - "train/contrastive_loss": 1.5845568180084229, - "train/negative_loss": 0.5357173085212708, - "train/num_negatives": 46, + "train/classification_loss": 0.26526975631713867, + "train/contrastive_loss": 2.9190073013305664, + "train/negative_loss": 1.8765313625335693, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 1.0488395690917969, - "train/total_loss": 0.4721786081790924 + "train/positive_loss": 1.0424760580062866, + "train/total_loss": 0.849071204662323 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.2374057173728943, - "train/contrastive_loss": 1.4225289821624756, - "train/negative_loss": 1.4225289821624756, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5219115018844604 - }, - { - "epoch": 7.984790874524715, - "eval_exact_match_accuracy": 0.2914285714285714, - "eval_hamming_loss": 0.06756302521008403, - "eval_loss": 0.5527490973472595, - "eval_macro_f1": 0.2700091410086497, - "eval_macro_precision": 0.5056314967172818, - "eval_macro_recall": 0.20974065546266732, - "eval_micro_f1": 0.535796766743649, - "eval_micro_precision": 0.8285714285714286, - "eval_micro_recall": 0.39590443686006827, - "eval_runtime": 2.6245, - "eval_samples_per_second": 200.039, - "eval_steps_per_second": 25.148, + "train/classification_loss": 0.18941755592823029, + "train/contrastive_loss": 0.9748981595039368, + "train/negative_loss": 0.9455454349517822, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.0293527040630579, + "train/total_loss": 0.3843972086906433 + }, + { + "epoch": 7.394366197183099, + "eval_exact_match_accuracy": 0.25044091710758376, + "eval_hamming_loss": 0.0724141508455234, + "eval_loss": 0.5969284772872925, + "eval_macro_f1": 0.2802413726884585, + "eval_macro_precision": 0.4537141410850705, + "eval_macro_recall": 0.22171561528881892, + "eval_micro_f1": 0.48676470588235293, + "eval_micro_precision": 0.7843601895734598, + "eval_micro_recall": 0.35287846481876334, + "eval_runtime": 2.8364, + "eval_samples_per_second": 199.904, + "eval_steps_per_second": 25.032, "step": 2100 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.22597961127758026, - "train/contrastive_loss": 1.7244973182678223, - "train/negative_loss": 0.6761484742164612, - "train/num_negatives": 34, - "train/num_positives": 14, - "train/positive_loss": 1.0483489036560059, - "train/total_loss": 0.5708791017532349 + "train/classification_loss": 0.1787373572587967, + "train/contrastive_loss": 0.47825801372528076, + "train/negative_loss": 0.43062078952789307, + "train/num_negatives": 30, + "train/num_positives": 16, + "train/positive_loss": 0.0476372204720974, + "train/total_loss": 0.27438896894454956 }, { - "epoch": 7.984790874524715, + "epoch": 7.394366197183099, "step": 2100, - "train/classification_loss": 0.21599963307380676, - "train/contrastive_loss": 1.3685818910598755, - "train/negative_loss": 1.0195105075836182, + "train/classification_loss": 0.18938905000686646, + "train/contrastive_loss": 1.7803001403808594, + "train/negative_loss": 0.7165501713752747, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.3490713834762573, - "train/total_loss": 0.4897160232067108 + "train/num_positives": 10, + "train/positive_loss": 1.06374990940094, + "train/total_loss": 0.5454490780830383 }, { - "epoch": 8.17490494296578, - "grad_norm": 10.365729331970215, - "learning_rate": 1.9688432267884324e-05, - "loss": 0.6418, + "epoch": 7.570422535211268, + "grad_norm": 13.924952507019043, + "learning_rate": 1.9711627906976747e-05, + "loss": 0.7351, "step": 2150 }, { - "epoch": 8.17490494296578, + "epoch": 7.570422535211268, "step": 2150, - "train/classification_loss": 0.18748225271701813, - "train/contrastive_loss": 0.5769376158714294, - "train/negative_loss": 0.5490038394927979, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.02793375961482525, - "train/total_loss": 0.3028697669506073 + "train/classification_loss": 0.20502950251102448, + "train/contrastive_loss": 1.5197179317474365, + "train/negative_loss": 0.3525352478027344, + "train/num_negatives": 40, + "train/num_positives": 4, + "train/positive_loss": 1.1671826839447021, + "train/total_loss": 0.5089731216430664 }, { - "epoch": 8.17490494296578, + "epoch": 7.570422535211268, "step": 2150, - "train/classification_loss": 0.1438782662153244, - "train/contrastive_loss": 0.24318671226501465, - "train/negative_loss": 0.1954665631055832, - "train/num_negatives": 30, - "train/num_positives": 10, - "train/positive_loss": 0.04772014170885086, - "train/total_loss": 0.19251561164855957 + "train/classification_loss": 0.15141382813453674, + "train/contrastive_loss": 0.9218471050262451, + "train/negative_loss": 0.7828749418258667, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.1389721930027008, + "train/total_loss": 0.3357832431793213 }, { - "epoch": 8.365019011406844, - "grad_norm": 8.257341384887695, - "learning_rate": 1.9680821917808222e-05, - "loss": 0.7179, + "epoch": 7.746478873239437, + "grad_norm": 11.801557540893555, + "learning_rate": 1.9704580690627205e-05, + "loss": 0.7747, "step": 2200 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.24943628907203674, - "train/contrastive_loss": 1.889557123184204, - "train/negative_loss": 0.7087753415107727, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.1807818412780762, - "train/total_loss": 0.6273477077484131 + "train/classification_loss": 0.233855739235878, + "train/contrastive_loss": 2.255545139312744, + "train/negative_loss": 1.3012739419937134, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.954271137714386, + "train/total_loss": 0.6849647760391235 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.21900370717048645, - "train/contrastive_loss": 2.6147537231445312, - "train/negative_loss": 1.4769008159637451, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 1.1378530263900757, - "train/total_loss": 0.7419544458389282 + "train/classification_loss": 0.26522618532180786, + "train/contrastive_loss": 1.7616727352142334, + "train/negative_loss": 0.7065722942352295, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 1.055100440979004, + "train/total_loss": 0.6175607442855835 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.17379038035869598, - "train/contrastive_loss": 1.9151513576507568, - "train/negative_loss": 0.8624277114868164, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.0527236461639404, - "train/total_loss": 0.5568206310272217 + "train/classification_loss": 0.25880903005599976, + "train/contrastive_loss": 3.44437837600708, + "train/negative_loss": 1.8525596857070923, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.5918185710906982, + "train/total_loss": 0.9476847052574158 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.20843183994293213, - "train/contrastive_loss": 2.237791061401367, - "train/negative_loss": 1.3298166990280151, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.9079742431640625, - "train/total_loss": 0.6559900641441345 + "train/classification_loss": 0.12664580345153809, + "train/contrastive_loss": 0.6547762751579285, + "train/negative_loss": 0.6209471225738525, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.03382916375994682, + "train/total_loss": 0.2576010823249817 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.1401105523109436, - "train/contrastive_loss": 1.5313498973846436, - "train/negative_loss": 0.6408353447914124, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.8905145525932312, - "train/total_loss": 0.44638052582740784 + "train/classification_loss": 0.2125016748905182, + "train/contrastive_loss": 2.5967750549316406, + "train/negative_loss": 2.051178455352783, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.5455965995788574, + "train/total_loss": 0.7318567037582397 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.19562679529190063, - "train/contrastive_loss": 2.7837634086608887, - "train/negative_loss": 1.6119648218154907, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 1.1717987060546875, - "train/total_loss": 0.7523794770240784 + "train/classification_loss": 0.19362123310565948, + "train/contrastive_loss": 2.632143259048462, + "train/negative_loss": 1.5997766256332397, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 1.0323666334152222, + "train/total_loss": 0.7200498580932617 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.23364757001399994, - "train/contrastive_loss": 2.0445809364318848, - "train/negative_loss": 0.9854739904403687, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 1.0591069459915161, - "train/total_loss": 0.6425637602806091 + "train/classification_loss": 0.20858298242092133, + "train/contrastive_loss": 1.524407982826233, + "train/negative_loss": 1.1166682243347168, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.4077397286891937, + "train/total_loss": 0.5134645700454712 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.1745101511478424, - "train/contrastive_loss": 1.687099814414978, - "train/negative_loss": 1.262963056564331, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.424136757850647, - "train/total_loss": 0.5119301080703735 + "train/classification_loss": 0.21285325288772583, + "train/contrastive_loss": 1.9451953172683716, + "train/negative_loss": 1.9451572895050049, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 3.802848732448183e-05, + "train/total_loss": 0.601892352104187 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.15578649938106537, - "train/contrastive_loss": 1.375629186630249, - "train/negative_loss": 0.989414393901825, + "train/classification_loss": 0.1049819067120552, + "train/contrastive_loss": 0.36691170930862427, + "train/negative_loss": 0.3426990211009979, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.38621485233306885, - "train/total_loss": 0.4309123158454895 + "train/positive_loss": 0.024212701246142387, + "train/total_loss": 0.17836424708366394 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.2770358622074127, - "train/contrastive_loss": 2.566657066345215, - "train/negative_loss": 1.3372126817703247, + "train/classification_loss": 0.1960151195526123, + "train/contrastive_loss": 2.0619232654571533, + "train/negative_loss": 0.9810680747032166, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.2294443845748901, - "train/total_loss": 0.7903672456741333 + "train/num_positives": 14, + "train/positive_loss": 1.0808552503585815, + "train/total_loss": 0.6083997488021851 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.20463621616363525, - "train/contrastive_loss": 2.4228434562683105, - "train/negative_loss": 1.7969471216201782, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.6258963346481323, - "train/total_loss": 0.6892049312591553 + "train/classification_loss": 0.15617330372333527, + "train/contrastive_loss": 1.9075117111206055, + "train/negative_loss": 0.790858805179596, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 1.1166529655456543, + "train/total_loss": 0.537675678730011 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.11976135522127151, - "train/contrastive_loss": 0.9961673021316528, - "train/negative_loss": 0.3578493595123291, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.6383179426193237, - "train/total_loss": 0.31899482011795044 + "train/classification_loss": 0.1824103146791458, + "train/contrastive_loss": 3.035715103149414, + "train/negative_loss": 1.5830165147781372, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 1.4526987075805664, + "train/total_loss": 0.7895533442497253 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.1979885697364807, - "train/contrastive_loss": 2.4924674034118652, - "train/negative_loss": 1.990096926689148, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.5023705363273621, - "train/total_loss": 0.6964820623397827 + "train/classification_loss": 0.20614732801914215, + "train/contrastive_loss": 3.8229174613952637, + "train/negative_loss": 1.84385085105896, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.9790666103363037, + "train/total_loss": 0.9707308411598206 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.12204289436340332, - "train/contrastive_loss": 0.7213383913040161, - "train/negative_loss": 0.7212517857551575, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 8.66230548126623e-05, - "train/total_loss": 0.26631057262420654 + "train/classification_loss": 0.17775031924247742, + "train/contrastive_loss": 1.8375892639160156, + "train/negative_loss": 1.0210528373718262, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.8165364861488342, + "train/total_loss": 0.545268177986145 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.13353750109672546, - "train/contrastive_loss": 1.656617283821106, - "train/negative_loss": 1.5821499824523926, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.07446733862161636, - "train/total_loss": 0.4648609757423401 + "train/classification_loss": 0.14816974103450775, + "train/contrastive_loss": 2.6717758178710938, + "train/negative_loss": 0.7289735674858093, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.9428021907806396, + "train/total_loss": 0.6825249195098877 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.14591483771800995, - "train/contrastive_loss": 1.2703533172607422, - "train/negative_loss": 0.6629962921142578, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.6073570847511292, - "train/total_loss": 0.39998549222946167 + "train/classification_loss": 0.16398699581623077, + "train/contrastive_loss": 0.9612963199615479, + "train/negative_loss": 0.48294222354888916, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.4783541262149811, + "train/total_loss": 0.3562462627887726 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.23275414109230042, - "train/contrastive_loss": 2.7202367782592773, - "train/negative_loss": 2.023674726486206, - "train/num_negatives": 40, + "train/classification_loss": 0.13100416958332062, + "train/contrastive_loss": 1.0867034196853638, + "train/negative_loss": 0.35729482769966125, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.6965619921684265, - "train/total_loss": 0.7768014669418335 + "train/positive_loss": 0.7294086217880249, + "train/total_loss": 0.3483448624610901 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.17720089852809906, - "train/contrastive_loss": 0.9427557587623596, - "train/negative_loss": 0.28303438425064087, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.6597213745117188, - "train/total_loss": 0.36575204133987427 + "train/classification_loss": 0.20591473579406738, + "train/contrastive_loss": 1.6879944801330566, + "train/negative_loss": 0.47784149646759033, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 1.2101529836654663, + "train/total_loss": 0.5435136556625366 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.17468976974487305, - "train/contrastive_loss": 0.8298830389976501, - "train/negative_loss": 0.8217445015907288, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.00813851784914732, - "train/total_loss": 0.34066638350486755 + "train/classification_loss": 0.15839135646820068, + "train/contrastive_loss": 0.7127677202224731, + "train/negative_loss": 0.5803985595703125, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.13236914575099945, + "train/total_loss": 0.3009449243545532 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.15209226310253143, - "train/contrastive_loss": 1.3479893207550049, - "train/negative_loss": 1.121045470237732, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.22694388031959534, - "train/total_loss": 0.42169010639190674 + "train/classification_loss": 0.19651007652282715, + "train/contrastive_loss": 3.902580738067627, + "train/negative_loss": 1.6494033336639404, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 2.2531774044036865, + "train/total_loss": 0.9770262241363525 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.24577617645263672, - "train/contrastive_loss": 1.8470311164855957, - "train/negative_loss": 0.25832998752593994, - "train/num_negatives": 44, + "train/classification_loss": 0.15365880727767944, + "train/contrastive_loss": 2.353194236755371, + "train/negative_loss": 2.1736857891082764, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.5887011289596558, - "train/total_loss": 0.6151823997497559 + "train/positive_loss": 0.17950856685638428, + "train/total_loss": 0.6242976188659668 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.27399805188179016, - "train/contrastive_loss": 1.9788891077041626, - "train/negative_loss": 1.6002839803695679, - "train/num_negatives": 44, + "train/classification_loss": 0.12539084255695343, + "train/contrastive_loss": 2.483067035675049, + "train/negative_loss": 1.8802618980407715, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.3786051273345947, - "train/total_loss": 0.6697758436203003 + "train/positive_loss": 0.6028050184249878, + "train/total_loss": 0.6220042705535889 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.14895671606063843, - "train/contrastive_loss": 1.7838791608810425, - "train/negative_loss": 0.38404572010040283, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 1.3998334407806396, - "train/total_loss": 0.505732536315918 + "train/classification_loss": 0.17275339365005493, + "train/contrastive_loss": 2.908426523208618, + "train/negative_loss": 1.844923973083496, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 1.063502550125122, + "train/total_loss": 0.7544386982917786 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.13669613003730774, - "train/contrastive_loss": 0.7987115383148193, - "train/negative_loss": 0.3135432302951813, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.4851682782173157, - "train/total_loss": 0.29643845558166504 + "train/classification_loss": 0.2464851438999176, + "train/contrastive_loss": 2.5663833618164062, + "train/negative_loss": 1.0961732864379883, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.470210075378418, + "train/total_loss": 0.7597618103027344 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.10292065888643265, - "train/contrastive_loss": 0.9347813725471497, - "train/negative_loss": 0.388984739780426, + "train/classification_loss": 0.19305849075317383, + "train/contrastive_loss": 3.053581476211548, + "train/negative_loss": 0.7467369437217712, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.5457966327667236, - "train/total_loss": 0.28987693786621094 + "train/num_positives": 10, + "train/positive_loss": 2.306844472885132, + "train/total_loss": 0.8037747740745544 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.27912813425064087, - "train/contrastive_loss": 1.5402354001998901, - "train/negative_loss": 0.31652846932411194, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.2237069606781006, - "train/total_loss": 0.5871752500534058 + "train/classification_loss": 0.2186601161956787, + "train/contrastive_loss": 3.229010820388794, + "train/negative_loss": 2.1998815536499023, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.0291292667388916, + "train/total_loss": 0.8644623160362244 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.25827136635780334, - "train/contrastive_loss": 2.959677219390869, - "train/negative_loss": 1.520568609237671, + "train/classification_loss": 0.19897770881652832, + "train/contrastive_loss": 1.5801575183868408, + "train/negative_loss": 1.565502643585205, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.4391086101531982, - "train/total_loss": 0.8502068519592285 + "train/num_positives": 4, + "train/positive_loss": 0.014654901809990406, + "train/total_loss": 0.5150092244148254 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.1970413774251938, - "train/contrastive_loss": 3.36331844329834, - "train/negative_loss": 2.6963775157928467, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.6669408082962036, - "train/total_loss": 0.869705080986023 + "train/classification_loss": 0.17531105875968933, + "train/contrastive_loss": 0.21678856015205383, + "train/negative_loss": 0.20787391066551208, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.008914647623896599, + "train/total_loss": 0.21866877377033234 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.1953045129776001, - "train/contrastive_loss": 1.3170843124389648, - "train/negative_loss": 0.8244885802268982, - "train/num_negatives": 40, + "train/classification_loss": 0.2555426061153412, + "train/contrastive_loss": 2.9623093605041504, + "train/negative_loss": 1.7703056335449219, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.4925956726074219, - "train/total_loss": 0.4587213695049286 + "train/positive_loss": 1.192003607749939, + "train/total_loss": 0.8480044603347778 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.2165527492761612, - "train/contrastive_loss": 1.8632102012634277, - "train/negative_loss": 1.5494983196258545, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.31371191143989563, - "train/total_loss": 0.5891947746276855 + "train/classification_loss": 0.2015833854675293, + "train/contrastive_loss": 0.5235978960990906, + "train/negative_loss": 0.5213149785995483, + "train/num_negatives": 38, + "train/num_positives": 10, + "train/positive_loss": 0.002282913774251938, + "train/total_loss": 0.3063029646873474 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.1384197622537613, - "train/contrastive_loss": 1.6589069366455078, - "train/negative_loss": 0.9867913722991943, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.6721155047416687, - "train/total_loss": 0.47020113468170166 + "train/classification_loss": 0.16498155891895294, + "train/contrastive_loss": 1.116623878479004, + "train/negative_loss": 1.1126141548156738, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.004009678494185209, + "train/total_loss": 0.38830631971359253 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.22079268097877502, - "train/contrastive_loss": 1.6202327013015747, - "train/negative_loss": 1.0597813129425049, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.5604513883590698, - "train/total_loss": 0.5448392629623413 + "train/classification_loss": 0.16207949817180634, + "train/contrastive_loss": 2.4319911003112793, + "train/negative_loss": 1.3011422157287598, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.130849003791809, + "train/total_loss": 0.6484777331352234 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.27488085627555847, - "train/contrastive_loss": 1.2833298444747925, - "train/negative_loss": 1.2825957536697388, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0007340621668845415, - "train/total_loss": 0.5315468311309814 + "train/classification_loss": 0.1915922313928604, + "train/contrastive_loss": 1.2845745086669922, + "train/negative_loss": 0.7174274325370789, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.5671471357345581, + "train/total_loss": 0.4485071301460266 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.1852637678384781, - "train/contrastive_loss": 1.301331639289856, - "train/negative_loss": 1.183530569076538, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.11780103296041489, - "train/total_loss": 0.44553011655807495 + "train/classification_loss": 0.21791309118270874, + "train/contrastive_loss": 2.680976629257202, + "train/negative_loss": 2.04085111618042, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.6401254534721375, + "train/total_loss": 0.7541084289550781 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.1703890711069107, - "train/contrastive_loss": 2.6556034088134766, - "train/negative_loss": 1.6441160440444946, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.0114872455596924, - "train/total_loss": 0.7015097737312317 + "train/classification_loss": 0.22994616627693176, + "train/contrastive_loss": 2.007884979248047, + "train/negative_loss": 1.3865667581558228, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.6213181614875793, + "train/total_loss": 0.6315231323242188 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.1802481710910797, - "train/contrastive_loss": 3.514472007751465, - "train/negative_loss": 1.6832563877105713, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.831215500831604, - "train/total_loss": 0.8831425905227661 + "train/classification_loss": 0.1472579389810562, + "train/contrastive_loss": 2.277780294418335, + "train/negative_loss": 2.277631998062134, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.00014824021491222084, + "train/total_loss": 0.6028140187263489 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.1537477821111679, - "train/contrastive_loss": 1.2966372966766357, - "train/negative_loss": 0.8525386452674866, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.44409871101379395, - "train/total_loss": 0.4130752682685852 + "train/classification_loss": 0.18912053108215332, + "train/contrastive_loss": 1.2177939414978027, + "train/negative_loss": 0.8141074776649475, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 0.40368643403053284, + "train/total_loss": 0.43267932534217834 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.17157655954360962, - "train/contrastive_loss": 0.8540363907814026, - "train/negative_loss": 0.8522709012031555, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.0017654973780736327, - "train/total_loss": 0.34238386154174805 + "train/classification_loss": 0.23758885264396667, + "train/contrastive_loss": 2.508648157119751, + "train/negative_loss": 2.180753469467163, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.3278946280479431, + "train/total_loss": 0.7393184900283813 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.19874049723148346, - "train/contrastive_loss": 0.7918590307235718, - "train/negative_loss": 0.783258855342865, - "train/num_negatives": 46, + "train/classification_loss": 0.20018039643764496, + "train/contrastive_loss": 1.1913447380065918, + "train/negative_loss": 0.5931902527809143, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.5981545448303223, + "train/total_loss": 0.43844935297966003 + }, + { + "epoch": 7.746478873239437, + "step": 2200, + "train/classification_loss": 0.2322784960269928, + "train/contrastive_loss": 4.559499740600586, + "train/negative_loss": 1.970737338066101, + "train/num_negatives": 42, "train/num_positives": 8, - "train/positive_loss": 0.008600180968642235, - "train/total_loss": 0.3571122884750366 + "train/positive_loss": 2.5887622833251953, + "train/total_loss": 1.1441785097122192 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.2013775259256363, - "train/contrastive_loss": 2.203746795654297, - "train/negative_loss": 2.133307456970215, + "train/classification_loss": 0.14572544395923615, + "train/contrastive_loss": 1.8016914129257202, + "train/negative_loss": 0.6206285953521729, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.07043930143117905, - "train/total_loss": 0.6421269178390503 + "train/num_positives": 10, + "train/positive_loss": 1.1810628175735474, + "train/total_loss": 0.5060637593269348 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.1799197494983673, - "train/contrastive_loss": 1.060455560684204, - "train/negative_loss": 1.059705138206482, + "train/classification_loss": 0.20211629569530487, + "train/contrastive_loss": 3.5900676250457764, + "train/negative_loss": 1.8990634679794312, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 1.6910041570663452, + "train/total_loss": 0.9201298356056213 + }, + { + "epoch": 7.746478873239437, + "step": 2200, + "train/classification_loss": 0.17881852388381958, + "train/contrastive_loss": 1.219581961631775, + "train/negative_loss": 1.2170060873031616, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.0025759157724678516, + "train/total_loss": 0.42273491621017456 + }, + { + "epoch": 7.746478873239437, + "step": 2200, + "train/classification_loss": 0.24955160915851593, + "train/contrastive_loss": 1.1467219591140747, + "train/negative_loss": 1.0726075172424316, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.0007504014065489173, - "train/total_loss": 0.3920108675956726 + "train/positive_loss": 0.07411445677280426, + "train/total_loss": 0.47889602184295654 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.20317992568016052, - "train/contrastive_loss": 3.1517133712768555, - "train/negative_loss": 2.327582597732544, - "train/num_negatives": 36, + "train/classification_loss": 0.17249681055545807, + "train/contrastive_loss": 0.6076031923294067, + "train/negative_loss": 0.5369259715080261, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.07067721337080002, + "train/total_loss": 0.2940174341201782 + }, + { + "epoch": 7.746478873239437, + "step": 2200, + "train/classification_loss": 0.32010331749916077, + "train/contrastive_loss": 2.603621244430542, + "train/negative_loss": 1.6959607601165771, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.8241308927536011, - "train/total_loss": 0.8335225582122803 + "train/positive_loss": 0.9076604843139648, + "train/total_loss": 0.8408275842666626 + }, + { + "epoch": 7.746478873239437, + "step": 2200, + "train/classification_loss": 0.16025418043136597, + "train/contrastive_loss": 1.9934375286102295, + "train/negative_loss": 1.0865634679794312, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.9068740606307983, + "train/total_loss": 0.5589417219161987 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.2142106145620346, - "train/contrastive_loss": 0.9611688256263733, - "train/negative_loss": 0.7391939759254456, + "train/classification_loss": 0.19057223200798035, + "train/contrastive_loss": 2.7621850967407227, + "train/negative_loss": 2.4370157718658447, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.22197483479976654, - "train/total_loss": 0.40644437074661255 + "train/num_positives": 14, + "train/positive_loss": 0.3251693844795227, + "train/total_loss": 0.7430092096328735 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.1564994603395462, - "train/contrastive_loss": 2.0154950618743896, - "train/negative_loss": 1.5570170879364014, + "train/classification_loss": 0.24548520147800446, + "train/contrastive_loss": 2.1916701793670654, + "train/negative_loss": 2.191657543182373, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.45847803354263306, - "train/total_loss": 0.5595985054969788 + "train/num_positives": 2, + "train/positive_loss": 1.2517053619376384e-05, + "train/total_loss": 0.6838192343711853 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.15486465394496918, - "train/contrastive_loss": 1.8358418941497803, - "train/negative_loss": 0.9644298553466797, + "train/classification_loss": 0.1856653392314911, + "train/contrastive_loss": 2.384842872619629, + "train/negative_loss": 1.2399189472198486, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.8714120984077454, - "train/total_loss": 0.5220330357551575 + "train/num_positives": 16, + "train/positive_loss": 1.1449238061904907, + "train/total_loss": 0.6626338958740234 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.26276373863220215, - "train/contrastive_loss": 1.5910183191299438, - "train/negative_loss": 1.1173884868621826, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.47362983226776123, - "train/total_loss": 0.5809674263000488 + "train/classification_loss": 0.14005175232887268, + "train/contrastive_loss": 0.5830338001251221, + "train/negative_loss": 0.20902292430400848, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.3740108907222748, + "train/total_loss": 0.25665852427482605 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.11615364998579025, - "train/contrastive_loss": 0.5229880213737488, - "train/negative_loss": 0.4901016354560852, - "train/num_negatives": 48, + "train/classification_loss": 0.20500682294368744, + "train/contrastive_loss": 0.9195634126663208, + "train/negative_loss": 0.9051429033279419, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 0.03288636356592178, - "train/total_loss": 0.22075125575065613 + "train/positive_loss": 0.014420506544411182, + "train/total_loss": 0.38891950249671936 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.14049400389194489, - "train/contrastive_loss": 0.40658193826675415, - "train/negative_loss": 0.17742277681827545, + "train/classification_loss": 0.20003816485404968, + "train/contrastive_loss": 1.102660894393921, + "train/negative_loss": 0.8248953819274902, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.2291591614484787, - "train/total_loss": 0.22181040048599243 + "train/num_positives": 14, + "train/positive_loss": 0.27776557207107544, + "train/total_loss": 0.42057034373283386 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.11487066000699997, - "train/contrastive_loss": 0.775407612323761, - "train/negative_loss": 0.7665122151374817, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.008895425125956535, - "train/total_loss": 0.2699521780014038 + "train/classification_loss": 0.30356451869010925, + "train/contrastive_loss": 3.1805849075317383, + "train/negative_loss": 1.5772780179977417, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 1.603306770324707, + "train/total_loss": 0.9396815299987793 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.19876199960708618, - "train/contrastive_loss": 1.4561779499053955, - "train/negative_loss": 0.3854422867298126, - "train/num_negatives": 28, + "train/classification_loss": 0.13979889452457428, + "train/contrastive_loss": 0.9882224798202515, + "train/negative_loss": 0.35013994574546814, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 1.0707356929779053, - "train/total_loss": 0.48999759554862976 + "train/positive_loss": 0.6380825042724609, + "train/total_loss": 0.33744341135025024 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.15280713140964508, - "train/contrastive_loss": 1.5872092247009277, - "train/negative_loss": 0.7175924777984619, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.869616687297821, - "train/total_loss": 0.4702489972114563 + "train/classification_loss": 0.1323823183774948, + "train/contrastive_loss": 0.7261881232261658, + "train/negative_loss": 0.29895681142807007, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.4272313117980957, + "train/total_loss": 0.27761995792388916 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.16472168266773224, - "train/contrastive_loss": 0.5010542273521423, - "train/negative_loss": 0.44847044348716736, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.05258379504084587, - "train/total_loss": 0.2649325132369995 + "train/classification_loss": 0.16428159177303314, + "train/contrastive_loss": 2.120096206665039, + "train/negative_loss": 0.7873652577400208, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.3327308893203735, + "train/total_loss": 0.5883008241653442 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.2247283011674881, - "train/contrastive_loss": 2.2589402198791504, - "train/negative_loss": 0.8531327247619629, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.405807375907898, - "train/total_loss": 0.6765163540840149 + "train/classification_loss": 0.2014031857252121, + "train/contrastive_loss": 2.4253745079040527, + "train/negative_loss": 1.2768518924713135, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.1485224962234497, + "train/total_loss": 0.6864780783653259 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.23302701115608215, - "train/contrastive_loss": 2.0726609230041504, - "train/negative_loss": 0.8081550598144531, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.2645058631896973, - "train/total_loss": 0.6475591659545898 + "train/classification_loss": 0.2026602178812027, + "train/contrastive_loss": 0.9674946665763855, + "train/negative_loss": 0.6935701966285706, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.27392446994781494, + "train/total_loss": 0.39615917205810547 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.19432538747787476, - "train/contrastive_loss": 1.1343895196914673, - "train/negative_loss": 0.4197683036327362, + "train/classification_loss": 0.1142815425992012, + "train/contrastive_loss": 0.11571035534143448, + "train/negative_loss": 0.10615988075733185, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.7146211862564087, - "train/total_loss": 0.4212033152580261 + "train/num_positives": 16, + "train/positive_loss": 0.00955047644674778, + "train/total_loss": 0.13742361962795258 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.15825487673282623, - "train/contrastive_loss": 2.32011079788208, - "train/negative_loss": 1.7314465045928955, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.5886642932891846, - "train/total_loss": 0.622277021408081 + "train/classification_loss": 0.18858285248279572, + "train/contrastive_loss": 2.473759412765503, + "train/negative_loss": 1.0796419382095337, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 1.3941174745559692, + "train/total_loss": 0.6833347678184509 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.24592669308185577, - "train/contrastive_loss": 2.7062840461730957, - "train/negative_loss": 1.460045576095581, + "train/classification_loss": 0.24107052385807037, + "train/contrastive_loss": 2.9323906898498535, + "train/negative_loss": 1.4752857685089111, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.2462385892868042, - "train/total_loss": 0.7871835231781006 + "train/num_positives": 2, + "train/positive_loss": 1.4571049213409424, + "train/total_loss": 0.8275486826896667 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.22029834985733032, - "train/contrastive_loss": 2.8271827697753906, - "train/negative_loss": 1.6463921070098877, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.180790662765503, - "train/total_loss": 0.7857348918914795 + "train/classification_loss": 0.14782081544399261, + "train/contrastive_loss": 2.7027158737182617, + "train/negative_loss": 1.2966796159744263, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.406036376953125, + "train/total_loss": 0.6883640289306641 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.18098047375679016, - "train/contrastive_loss": 2.5872645378112793, - "train/negative_loss": 1.4547581672668457, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.132506251335144, - "train/total_loss": 0.6984333992004395 + "train/classification_loss": 0.18904618918895721, + "train/contrastive_loss": 1.1094850301742554, + "train/negative_loss": 0.8641249537467957, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.24536004662513733, + "train/total_loss": 0.4109432101249695 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.2019614279270172, - "train/contrastive_loss": 2.4925613403320312, - "train/negative_loss": 1.620702862739563, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.8718584179878235, - "train/total_loss": 0.7004736661911011 + "train/classification_loss": 0.19876940548419952, + "train/contrastive_loss": 2.6384170055389404, + "train/negative_loss": 1.0102717876434326, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 1.6281452178955078, + "train/total_loss": 0.7264528274536133 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.2169322818517685, - "train/contrastive_loss": 1.5056066513061523, - "train/negative_loss": 0.4353627562522888, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.0702438354492188, - "train/total_loss": 0.5180535912513733 + "train/classification_loss": 0.171685129404068, + "train/contrastive_loss": 3.6967501640319824, + "train/negative_loss": 3.696747303009033, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 2.849109705493902e-06, + "train/total_loss": 0.9110351800918579 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.24636119604110718, - "train/contrastive_loss": 3.1300458908081055, - "train/negative_loss": 1.4358484745025635, + "train/classification_loss": 0.18085412681102753, + "train/contrastive_loss": 1.8239394426345825, + "train/negative_loss": 0.6054428815841675, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.6941975355148315, - "train/total_loss": 0.8723703622817993 + "train/positive_loss": 1.218496561050415, + "train/total_loss": 0.5456420183181763 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.1675446778535843, - "train/contrastive_loss": 0.5796648859977722, - "train/negative_loss": 0.5778061747550964, + "train/classification_loss": 0.21124012768268585, + "train/contrastive_loss": 2.7942728996276855, + "train/negative_loss": 1.3598989248275757, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.0018587025115266442, - "train/total_loss": 0.28347766399383545 + "train/num_positives": 8, + "train/positive_loss": 1.4343738555908203, + "train/total_loss": 0.7700946927070618 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.1612347513437271, - "train/contrastive_loss": 1.3028966188430786, - "train/negative_loss": 0.7380688190460205, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.5648277997970581, - "train/total_loss": 0.42181408405303955 + "train/classification_loss": 0.16738319396972656, + "train/contrastive_loss": 3.5876283645629883, + "train/negative_loss": 1.4816099405288696, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 2.106018543243408, + "train/total_loss": 0.8849088549613953 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.14656195044517517, - "train/contrastive_loss": 1.462990403175354, - "train/negative_loss": 0.42768430709838867, - "train/num_negatives": 46, + "train/classification_loss": 0.26058894395828247, + "train/contrastive_loss": 2.2595388889312744, + "train/negative_loss": 1.5896544456481934, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 1.0353060960769653, - "train/total_loss": 0.4391600489616394 + "train/positive_loss": 0.6698843836784363, + "train/total_loss": 0.7124967575073242 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.2371242791414261, - "train/contrastive_loss": 1.5739837884902954, - "train/negative_loss": 1.5739837884902954, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5519210696220398 - }, - { - "epoch": 8.365019011406844, - "eval_exact_match_accuracy": 0.2704761904761905, - "eval_hamming_loss": 0.06991596638655462, - "eval_loss": 0.5396168231964111, - "eval_macro_f1": 0.25310809620536184, - "eval_macro_precision": 0.5272363609733852, - "eval_macro_recall": 0.18595876864645505, - "eval_micro_f1": 0.5023923444976076, - "eval_micro_precision": 0.84, - "eval_micro_recall": 0.3583617747440273, - "eval_runtime": 2.6229, - "eval_samples_per_second": 200.16, - "eval_steps_per_second": 25.163, + "train/classification_loss": 0.16976019740104675, + "train/contrastive_loss": 0.4422369599342346, + "train/negative_loss": 0.39408010244369507, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.04815686121582985, + "train/total_loss": 0.2582075893878937 + }, + { + "epoch": 7.746478873239437, + "eval_exact_match_accuracy": 0.27336860670194, + "eval_hamming_loss": 0.0706504824151883, + "eval_loss": 0.598036527633667, + "eval_macro_f1": 0.31422932723861985, + "eval_macro_precision": 0.5684405947030052, + "eval_macro_recall": 0.24597270648439978, + "eval_micro_f1": 0.5047272727272727, + "eval_micro_precision": 0.7940503432494279, + "eval_micro_recall": 0.3699360341151386, + "eval_runtime": 2.842, + "eval_samples_per_second": 199.507, + "eval_steps_per_second": 24.982, "step": 2200 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.1381554901599884, - "train/contrastive_loss": 1.3074227571487427, - "train/negative_loss": 0.8569817543029785, + "train/classification_loss": 0.12398000061511993, + "train/contrastive_loss": 1.5109673738479614, + "train/negative_loss": 0.7682982087135315, "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.45044103264808655, - "train/total_loss": 0.3996400535106659 + "train/positive_loss": 0.7426691651344299, + "train/total_loss": 0.42617350816726685 }, { - "epoch": 8.365019011406844, + "epoch": 7.746478873239437, "step": 2200, - "train/classification_loss": 0.1319269984960556, - "train/contrastive_loss": 0.6194708347320557, - "train/negative_loss": 0.5880257487297058, + "train/classification_loss": 0.220085009932518, + "train/contrastive_loss": 2.30934476852417, + "train/negative_loss": 0.9126915335655212, "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.03144511580467224, - "train/total_loss": 0.255821168422699 + "train/positive_loss": 1.3966532945632935, + "train/total_loss": 0.6819539666175842 }, { - "epoch": 8.55513307984791, - "grad_norm": 6.365290641784668, - "learning_rate": 1.9673211567732117e-05, - "loss": 0.6793, + "epoch": 7.922535211267606, + "grad_norm": 21.52375602722168, + "learning_rate": 1.969753347427766e-05, + "loss": 0.7352, "step": 2250 }, { - "epoch": 8.55513307984791, + "epoch": 7.922535211267606, "step": 2250, - "train/classification_loss": 0.17412221431732178, - "train/contrastive_loss": 0.4739062786102295, - "train/negative_loss": 0.37623485922813416, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 0.09767141193151474, - "train/total_loss": 0.2689034640789032 + "train/classification_loss": 0.1502661257982254, + "train/contrastive_loss": 0.4690514802932739, + "train/negative_loss": 0.36362096667289734, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.10543051362037659, + "train/total_loss": 0.2440764307975769 }, { - "epoch": 8.55513307984791, + "epoch": 7.922535211267606, "step": 2250, - "train/classification_loss": 0.1655305176973343, - "train/contrastive_loss": 0.7931451797485352, - "train/negative_loss": 0.6361735463142395, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.15697163343429565, - "train/total_loss": 0.32415956258773804 + "train/classification_loss": 0.14285258948802948, + "train/contrastive_loss": 0.36563462018966675, + "train/negative_loss": 0.35940900444984436, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.00622561713680625, + "train/total_loss": 0.21597951650619507 }, { - "epoch": 8.745247148288973, - "grad_norm": 6.3515625, - "learning_rate": 1.9665601217656015e-05, - "loss": 0.7131, + "epoch": 8.098591549295774, + "grad_norm": 6.245151519775391, + "learning_rate": 1.969048625792812e-05, + "loss": 0.6935, "step": 2300 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.25564149022102356, - "train/contrastive_loss": 1.6840431690216064, - "train/negative_loss": 0.879407525062561, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.8046356439590454, - "train/total_loss": 0.5924501419067383 + "train/classification_loss": 0.2442706674337387, + "train/contrastive_loss": 2.3785529136657715, + "train/negative_loss": 1.3433853387832642, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.0351674556732178, + "train/total_loss": 0.7199812531471252 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.213272362947464, - "train/contrastive_loss": 2.1640923023223877, - "train/negative_loss": 1.2412561178207397, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.9228361248970032, - "train/total_loss": 0.6460908651351929 + "train/classification_loss": 0.2727251350879669, + "train/contrastive_loss": 1.3389389514923096, + "train/negative_loss": 0.6907218098640442, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.6482172012329102, + "train/total_loss": 0.5405129194259644 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.1685238778591156, - "train/contrastive_loss": 1.6907427310943604, - "train/negative_loss": 0.5414727330207825, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.1492700576782227, - "train/total_loss": 0.5066724419593811 + "train/classification_loss": 0.25447356700897217, + "train/contrastive_loss": 2.2609119415283203, + "train/negative_loss": 1.1106691360473633, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.1502426862716675, + "train/total_loss": 0.7066559791564941 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.18707427382469177, - "train/contrastive_loss": 2.953325033187866, - "train/negative_loss": 1.7318259477615356, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.2214990854263306, - "train/total_loss": 0.7777392864227295 + "train/classification_loss": 0.1366354376077652, + "train/contrastive_loss": 2.00216007232666, + "train/negative_loss": 1.5390781164169312, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.46308207511901855, + "train/total_loss": 0.5370674729347229 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.14191240072250366, - "train/contrastive_loss": 1.946249008178711, - "train/negative_loss": 1.4570705890655518, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.48917844891548157, - "train/total_loss": 0.5311622023582458 + "train/classification_loss": 0.19932346045970917, + "train/contrastive_loss": 2.6040477752685547, + "train/negative_loss": 2.457207679748535, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.14684009552001953, + "train/total_loss": 0.7201330661773682 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.1956971436738968, - "train/contrastive_loss": 2.24814510345459, - "train/negative_loss": 1.1229557991027832, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 1.1251893043518066, - "train/total_loss": 0.6453261971473694 + "train/classification_loss": 0.20630595088005066, + "train/contrastive_loss": 2.2803642749786377, + "train/negative_loss": 1.6419827938079834, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.6383814215660095, + "train/total_loss": 0.6623787879943848 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.21184144914150238, - "train/contrastive_loss": 1.7972759008407593, - "train/negative_loss": 1.2061266899108887, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.5911492109298706, - "train/total_loss": 0.5712966322898865 + "train/classification_loss": 0.18988202512264252, + "train/contrastive_loss": 1.6799254417419434, + "train/negative_loss": 0.996150016784668, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.6837754845619202, + "train/total_loss": 0.5258671045303345 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.15167707204818726, - "train/contrastive_loss": 1.8371989727020264, - "train/negative_loss": 1.2461752891540527, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.5910236239433289, - "train/total_loss": 0.5191168785095215 + "train/classification_loss": 0.218847393989563, + "train/contrastive_loss": 1.7794795036315918, + "train/negative_loss": 1.7788747549057007, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 0.00060469307936728, + "train/total_loss": 0.5747432708740234 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.15198364853858948, - "train/contrastive_loss": 1.8961825370788574, - "train/negative_loss": 1.3115285634994507, + "train/classification_loss": 0.10503634065389633, + "train/contrastive_loss": 0.46098262071609497, + "train/negative_loss": 0.3858431279659271, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.5846539735794067, - "train/total_loss": 0.5312201976776123 + "train/positive_loss": 0.07513950765132904, + "train/total_loss": 0.19723287224769592 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.307724267244339, - "train/contrastive_loss": 2.938387393951416, - "train/negative_loss": 1.4973338842391968, + "train/classification_loss": 0.18408505618572235, + "train/contrastive_loss": 1.5874762535095215, + "train/negative_loss": 1.101678729057312, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.4410535097122192, - "train/total_loss": 0.8954017162322998 + "train/num_positives": 14, + "train/positive_loss": 0.48579755425453186, + "train/total_loss": 0.5015802979469299 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.17580287158489227, - "train/contrastive_loss": 1.4024055004119873, - "train/negative_loss": 1.1170488595962524, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.2853566110134125, - "train/total_loss": 0.4562839865684509 + "train/classification_loss": 0.1481398195028305, + "train/contrastive_loss": 1.0276883840560913, + "train/negative_loss": 0.9641227722167969, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.06356561928987503, + "train/total_loss": 0.35367751121520996 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.11936670541763306, - "train/contrastive_loss": 0.9668710231781006, - "train/negative_loss": 0.4054192006587982, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.56145179271698, - "train/total_loss": 0.31274092197418213 + "train/classification_loss": 0.18674065172672272, + "train/contrastive_loss": 1.9973684549331665, + "train/negative_loss": 1.9967641830444336, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.0006042941240593791, + "train/total_loss": 0.5862143635749817 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.187508225440979, - "train/contrastive_loss": 2.7959744930267334, - "train/negative_loss": 2.094265937805176, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.7017084956169128, - "train/total_loss": 0.7467031478881836 + "train/classification_loss": 0.21244896948337555, + "train/contrastive_loss": 3.3329052925109863, + "train/negative_loss": 2.1440296173095703, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.1888757944107056, + "train/total_loss": 0.8790300488471985 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.13271595537662506, - "train/contrastive_loss": 2.142529010772705, - "train/negative_loss": 2.105534791946411, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.036994270980358124, - "train/total_loss": 0.5612217783927917 + "train/classification_loss": 0.1680147498846054, + "train/contrastive_loss": 0.9330901503562927, + "train/negative_loss": 0.8515809178352356, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.08150923997163773, + "train/total_loss": 0.35463279485702515 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.1331949234008789, - "train/contrastive_loss": 2.667973518371582, - "train/negative_loss": 1.2202417850494385, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.447731852531433, - "train/total_loss": 0.6667896509170532 + "train/classification_loss": 0.13100989162921906, + "train/contrastive_loss": 2.4437777996063232, + "train/negative_loss": 0.763271152973175, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.680506706237793, + "train/total_loss": 0.6197654604911804 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.15100054442882538, - "train/contrastive_loss": 0.5283867120742798, - "train/negative_loss": 0.4459571838378906, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.08242954313755035, - "train/total_loss": 0.25667789578437805 + "train/classification_loss": 0.16607040166854858, + "train/contrastive_loss": 1.2120912075042725, + "train/negative_loss": 0.7495582103729248, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.46253302693367004, + "train/total_loss": 0.4084886312484741 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.21924848854541779, - "train/contrastive_loss": 2.4521141052246094, - "train/negative_loss": 1.7866642475128174, - "train/num_negatives": 40, + "train/classification_loss": 0.12100114673376083, + "train/contrastive_loss": 1.183854579925537, + "train/negative_loss": 0.6361507177352905, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.6654497981071472, - "train/total_loss": 0.7096713185310364 + "train/positive_loss": 0.5477039217948914, + "train/total_loss": 0.3577720522880554 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.1666816920042038, - "train/contrastive_loss": 0.7052980661392212, - "train/negative_loss": 0.2530880570411682, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.452210009098053, - "train/total_loss": 0.30774131417274475 + "train/classification_loss": 0.18046681582927704, + "train/contrastive_loss": 0.9073315858840942, + "train/negative_loss": 0.5911673307418823, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.3161642849445343, + "train/total_loss": 0.3619331419467926 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.18841159343719482, - "train/contrastive_loss": 1.492918848991394, - "train/negative_loss": 1.454498052597046, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.038420796394348145, - "train/total_loss": 0.4869953691959381 + "train/classification_loss": 0.1572113335132599, + "train/contrastive_loss": 0.7504340410232544, + "train/negative_loss": 0.7349439859390259, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.015490069054067135, + "train/total_loss": 0.30729812383651733 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.16087009012699127, - "train/contrastive_loss": 2.323456048965454, - "train/negative_loss": 0.936522901058197, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.3869330883026123, - "train/total_loss": 0.6255612969398499 + "train/classification_loss": 0.20097024738788605, + "train/contrastive_loss": 3.7277727127075195, + "train/negative_loss": 1.5457643270492554, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 2.1820082664489746, + "train/total_loss": 0.9465247988700867 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.21629714965820312, - "train/contrastive_loss": 0.9931620359420776, - "train/negative_loss": 0.2764371335506439, - "train/num_negatives": 44, + "train/classification_loss": 0.15162619948387146, + "train/contrastive_loss": 2.49060320854187, + "train/negative_loss": 2.3157835006713867, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.7167248725891113, - "train/total_loss": 0.4149295687675476 + "train/positive_loss": 0.17481963336467743, + "train/total_loss": 0.649746835231781 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.2802070081233978, - "train/contrastive_loss": 1.351233959197998, - "train/negative_loss": 1.2876536846160889, - "train/num_negatives": 44, + "train/classification_loss": 0.1228061392903328, + "train/contrastive_loss": 2.7641682624816895, + "train/negative_loss": 2.17568302154541, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.0635802149772644, - "train/total_loss": 0.550453782081604 + "train/positive_loss": 0.5884852409362793, + "train/total_loss": 0.675639808177948 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.12829634547233582, - "train/contrastive_loss": 1.0104339122772217, - "train/negative_loss": 0.2518037259578705, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.7586301565170288, - "train/total_loss": 0.3303831219673157 + "train/classification_loss": 0.1735696792602539, + "train/contrastive_loss": 2.5100314617156982, + "train/negative_loss": 2.0456044673919678, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.4644269347190857, + "train/total_loss": 0.6755759716033936 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.12986783683300018, - "train/contrastive_loss": 0.32160302996635437, - "train/negative_loss": 0.31117120385169983, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.010431827045977116, - "train/total_loss": 0.1941884458065033 + "train/classification_loss": 0.24511320888996124, + "train/contrastive_loss": 3.0371694564819336, + "train/negative_loss": 2.0945348739624023, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.9426344633102417, + "train/total_loss": 0.8525471091270447 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.10910703241825104, - "train/contrastive_loss": 0.9432503581047058, - "train/negative_loss": 0.6096394062042236, + "train/classification_loss": 0.1792777180671692, + "train/contrastive_loss": 1.6307547092437744, + "train/negative_loss": 0.9269121885299683, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.3336109519004822, - "train/total_loss": 0.297757089138031 + "train/num_positives": 10, + "train/positive_loss": 0.7038425207138062, + "train/total_loss": 0.505428671836853 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.25786715745925903, - "train/contrastive_loss": 1.5562891960144043, - "train/negative_loss": 0.32869672775268555, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.2275924682617188, - "train/total_loss": 0.5691249966621399 + "train/classification_loss": 0.2391292303800583, + "train/contrastive_loss": 3.885842800140381, + "train/negative_loss": 3.1626739501953125, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.7231688499450684, + "train/total_loss": 1.0162978172302246 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.2677094638347626, - "train/contrastive_loss": 2.528489112854004, - "train/negative_loss": 1.5119816064834595, + "train/classification_loss": 0.19246800243854523, + "train/contrastive_loss": 1.6253114938735962, + "train/negative_loss": 1.6245441436767578, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.0165073871612549, - "train/total_loss": 0.7734073400497437 + "train/num_positives": 4, + "train/positive_loss": 0.0007673421059735119, + "train/total_loss": 0.5175303220748901 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.17607028782367706, - "train/contrastive_loss": 2.2362399101257324, - "train/negative_loss": 1.9997859001159668, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.2364540994167328, - "train/total_loss": 0.6233182549476624 + "train/classification_loss": 0.18269632756710052, + "train/contrastive_loss": 0.24485749006271362, + "train/negative_loss": 0.20135609805583954, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.043501388281583786, + "train/total_loss": 0.23166783154010773 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.17705130577087402, - "train/contrastive_loss": 0.9317057728767395, - "train/negative_loss": 0.6830798983573914, - "train/num_negatives": 40, + "train/classification_loss": 0.26650598645210266, + "train/contrastive_loss": 2.9885897636413574, + "train/negative_loss": 1.6735867261886597, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.24862585961818695, - "train/total_loss": 0.3633924722671509 - }, - { - "epoch": 8.745247148288973, - "step": 2300, - "train/classification_loss": 0.21474570035934448, - "train/contrastive_loss": 1.3934574127197266, - "train/negative_loss": 0.9899322986602783, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.40352514386177063, - "train/total_loss": 0.4934372007846832 + "train/positive_loss": 1.3150030374526978, + "train/total_loss": 0.8642239570617676 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.1522168517112732, - "train/contrastive_loss": 1.8048934936523438, - "train/negative_loss": 0.6039363145828247, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 1.200957179069519, - "train/total_loss": 0.5131955146789551 - }, - { - "epoch": 8.745247148288973, - "step": 2300, - "train/classification_loss": 0.22807922959327698, - "train/contrastive_loss": 2.4680328369140625, - "train/negative_loss": 1.379908561706543, + "train/classification_loss": 0.20834429562091827, + "train/contrastive_loss": 1.2400048971176147, + "train/negative_loss": 1.2383698225021362, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.088124394416809, - "train/total_loss": 0.7216857671737671 - }, - { - "epoch": 8.745247148288973, - "step": 2300, - "train/classification_loss": 0.27649426460266113, - "train/contrastive_loss": 1.3497990369796753, - "train/negative_loss": 1.3492777347564697, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0005212592659518123, - "train/total_loss": 0.5464540719985962 + "train/num_positives": 10, + "train/positive_loss": 0.0016350996447727084, + "train/total_loss": 0.45634526014328003 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.21252788603305817, - "train/contrastive_loss": 1.9090322256088257, - "train/negative_loss": 1.0151704549789429, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.8938617706298828, - "train/total_loss": 0.5943343639373779 + "train/classification_loss": 0.1626977175474167, + "train/contrastive_loss": 1.3122689723968506, + "train/negative_loss": 1.306136965751648, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.0061319489032030106, + "train/total_loss": 0.425151526927948 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.20080476999282837, - "train/contrastive_loss": 3.803225517272949, - "train/negative_loss": 2.300137519836426, + "train/classification_loss": 0.16451436281204224, + "train/contrastive_loss": 2.6817378997802734, + "train/negative_loss": 1.554318904876709, "train/num_negatives": 52, "train/num_positives": 4, - "train/positive_loss": 1.5030879974365234, - "train/total_loss": 0.9614498615264893 + "train/positive_loss": 1.127418875694275, + "train/total_loss": 0.700861930847168 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.17966322600841522, - "train/contrastive_loss": 3.9475831985473633, - "train/negative_loss": 1.4058130979537964, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 2.5417702198028564, - "train/total_loss": 0.9691798686981201 + "train/classification_loss": 0.18853893876075745, + "train/contrastive_loss": 1.156378984451294, + "train/negative_loss": 0.5881754755973816, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.5682035684585571, + "train/total_loss": 0.41981473565101624 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.1638893038034439, - "train/contrastive_loss": 0.9626883268356323, - "train/negative_loss": 0.7429466247558594, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.21974170207977295, - "train/total_loss": 0.3564269542694092 + "train/classification_loss": 0.23048639297485352, + "train/contrastive_loss": 2.103973865509033, + "train/negative_loss": 1.7719988822937012, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.3319750726222992, + "train/total_loss": 0.6512811779975891 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.19388850033283234, - "train/contrastive_loss": 1.3062067031860352, - "train/negative_loss": 0.951777994632721, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.354428768157959, - "train/total_loss": 0.45512986183166504 + "train/classification_loss": 0.24674762785434723, + "train/contrastive_loss": 1.657181739807129, + "train/negative_loss": 1.3021827936172485, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.35499894618988037, + "train/total_loss": 0.5781840085983276 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.19720274209976196, - "train/contrastive_loss": 1.6345824003219604, - "train/negative_loss": 1.595065951347351, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.03951645269989967, - "train/total_loss": 0.5241192579269409 + "train/classification_loss": 0.14322857558727264, + "train/contrastive_loss": 2.511337995529175, + "train/negative_loss": 2.511237144470215, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.00010087047121487558, + "train/total_loss": 0.6454961895942688 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.18273985385894775, - "train/contrastive_loss": 1.7057920694351196, - "train/negative_loss": 1.6898945569992065, + "train/classification_loss": 0.2110125571489334, + "train/contrastive_loss": 1.54874587059021, + "train/negative_loss": 0.8461430668830872, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.015897564589977264, - "train/total_loss": 0.5238982439041138 + "train/num_positives": 8, + "train/positive_loss": 0.702602744102478, + "train/total_loss": 0.5207617282867432 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.16329535841941833, - "train/contrastive_loss": 0.7608721256256104, - "train/negative_loss": 0.7259606719017029, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.034911446273326874, - "train/total_loss": 0.31546980142593384 + "train/classification_loss": 0.2378484010696411, + "train/contrastive_loss": 1.8977556228637695, + "train/negative_loss": 1.5594482421875, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.33830738067626953, + "train/total_loss": 0.6173995733261108 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.19093585014343262, - "train/contrastive_loss": 2.30086350440979, - "train/negative_loss": 1.7619953155517578, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.538868248462677, - "train/total_loss": 0.6511085629463196 + "train/classification_loss": 0.20430578291416168, + "train/contrastive_loss": 0.7996668219566345, + "train/negative_loss": 0.3860071003437042, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.4136597216129303, + "train/total_loss": 0.3642391562461853 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.20809049904346466, - "train/contrastive_loss": 0.9592143297195435, - "train/negative_loss": 0.38255760073661804, + "train/classification_loss": 0.2435009628534317, + "train/contrastive_loss": 3.9582719802856445, + "train/negative_loss": 1.2625460624694824, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.5766567587852478, - "train/total_loss": 0.3999333679676056 + "train/num_positives": 8, + "train/positive_loss": 2.695725917816162, + "train/total_loss": 1.0351554155349731 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.1507195085287094, - "train/contrastive_loss": 2.2637648582458496, - "train/negative_loss": 1.1590771675109863, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.1046876907348633, - "train/total_loss": 0.6034724712371826 + "train/classification_loss": 0.14390785992145538, + "train/contrastive_loss": 1.3989417552947998, + "train/negative_loss": 0.8301483988761902, + "train/num_negatives": 46, + "train/num_positives": 10, + "train/positive_loss": 0.5687934160232544, + "train/total_loss": 0.42369621992111206 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.14869409799575806, - "train/contrastive_loss": 0.6911836862564087, - "train/negative_loss": 0.20212247967720032, - "train/num_negatives": 40, + "train/classification_loss": 0.16942669451236725, + "train/contrastive_loss": 2.480360507965088, + "train/negative_loss": 1.3820008039474487, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.48906123638153076, - "train/total_loss": 0.2869308590888977 + "train/positive_loss": 1.0983595848083496, + "train/total_loss": 0.6654987931251526 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.2695881426334381, - "train/contrastive_loss": 1.6793649196624756, - "train/negative_loss": 1.0974435806274414, - "train/num_negatives": 48, + "train/classification_loss": 0.17368774116039276, + "train/contrastive_loss": 0.5367939472198486, + "train/negative_loss": 0.5365847945213318, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.00020916196808684617, + "train/total_loss": 0.2810465395450592 + }, + { + "epoch": 8.098591549295774, + "step": 2300, + "train/classification_loss": 0.2790934145450592, + "train/contrastive_loss": 1.247010350227356, + "train/negative_loss": 1.0117290019989014, + "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.5819213390350342, - "train/total_loss": 0.6054611206054688 + "train/positive_loss": 0.23528137803077698, + "train/total_loss": 0.5284954905509949 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.10421501100063324, - "train/contrastive_loss": 0.19768022000789642, - "train/negative_loss": 0.19766490161418915, + "train/classification_loss": 0.17889797687530518, + "train/contrastive_loss": 0.9467892646789551, + "train/negative_loss": 0.9327142834663391, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.014075009152293205, + "train/total_loss": 0.3682558536529541 + }, + { + "epoch": 8.098591549295774, + "step": 2300, + "train/classification_loss": 0.32379627227783203, + "train/contrastive_loss": 2.387416362762451, + "train/negative_loss": 1.2085150480270386, + "train/num_negatives": 30, + "train/num_positives": 18, + "train/positive_loss": 1.1789014339447021, + "train/total_loss": 0.8012795448303223 + }, + { + "epoch": 8.098591549295774, + "step": 2300, + "train/classification_loss": 0.1566537767648697, + "train/contrastive_loss": 1.6297328472137451, + "train/negative_loss": 1.0654380321502686, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.5642948150634766, + "train/total_loss": 0.4826003313064575 + }, + { + "epoch": 8.098591549295774, + "step": 2300, + "train/classification_loss": 0.2062344253063202, + "train/contrastive_loss": 3.2087810039520264, + "train/negative_loss": 2.774134397506714, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.4346466660499573, + "train/total_loss": 0.8479906320571899 + }, + { + "epoch": 8.098591549295774, + "step": 2300, + "train/classification_loss": 0.22560301423072815, + "train/contrastive_loss": 2.996796131134033, + "train/negative_loss": 2.996795177459717, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.5318579244194552e-05, - "train/total_loss": 0.14375105500221252 + "train/num_positives": 2, + "train/positive_loss": 9.536747711536009e-07, + "train/total_loss": 0.8249622583389282 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.14614666998386383, - "train/contrastive_loss": 0.4793166220188141, - "train/negative_loss": 0.4410642385482788, - "train/num_negatives": 38, + "train/classification_loss": 0.1849716305732727, + "train/contrastive_loss": 2.3432679176330566, + "train/negative_loss": 1.2241214513778687, + "train/num_negatives": 40, "train/num_positives": 16, - "train/positive_loss": 0.03825238347053528, - "train/total_loss": 0.2420099973678589 + "train/positive_loss": 1.1191463470458984, + "train/total_loss": 0.6536252498626709 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.12269327044487, - "train/contrastive_loss": 1.057956337928772, - "train/negative_loss": 0.939552366733551, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.11840400844812393, - "train/total_loss": 0.33428454399108887 + "train/classification_loss": 0.12908166646957397, + "train/contrastive_loss": 0.1698368489742279, + "train/negative_loss": 0.10628936439752579, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.06354749202728271, + "train/total_loss": 0.16304904222488403 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.20189327001571655, - "train/contrastive_loss": 2.2615408897399902, - "train/negative_loss": 1.8041224479675293, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.45741844177246094, - "train/total_loss": 0.6542014479637146 + "train/classification_loss": 0.18918542563915253, + "train/contrastive_loss": 0.9553216695785522, + "train/negative_loss": 0.9142136573791504, + "train/num_negatives": 40, + "train/num_positives": 8, + "train/positive_loss": 0.041108034551143646, + "train/total_loss": 0.3802497684955597 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.15396921336650848, - "train/contrastive_loss": 1.174849271774292, - "train/negative_loss": 0.5957318544387817, - "train/num_negatives": 42, + "train/classification_loss": 0.2061411440372467, + "train/contrastive_loss": 1.1246836185455322, + "train/negative_loss": 1.087032675743103, + "train/num_negatives": 38, "train/num_positives": 14, - "train/positive_loss": 0.5791174173355103, - "train/total_loss": 0.3889390826225281 + "train/positive_loss": 0.037650998681783676, + "train/total_loss": 0.43107786774635315 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.15312954783439636, - "train/contrastive_loss": 0.6024721264839172, - "train/negative_loss": 0.5658827424049377, - "train/num_negatives": 50, + "train/classification_loss": 0.29631879925727844, + "train/contrastive_loss": 2.7426772117614746, + "train/negative_loss": 1.6752409934997559, + "train/num_negatives": 36, "train/num_positives": 6, - "train/positive_loss": 0.03658938407897949, - "train/total_loss": 0.2736239731311798 + "train/positive_loss": 1.0674362182617188, + "train/total_loss": 0.8448542356491089 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.21128174662590027, - "train/contrastive_loss": 1.9345735311508179, - "train/negative_loss": 0.9108494520187378, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.02372407913208, - "train/total_loss": 0.5981964468955994 + "train/classification_loss": 0.13911233842372894, + "train/contrastive_loss": 0.5739650726318359, + "train/negative_loss": 0.3104524314403534, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.26351261138916016, + "train/total_loss": 0.25390535593032837 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.23375721275806427, - "train/contrastive_loss": 3.3098177909851074, - "train/negative_loss": 2.2790353298187256, + "train/classification_loss": 0.12644430994987488, + "train/contrastive_loss": 0.8025156259536743, + "train/negative_loss": 0.2920730710029602, "train/num_negatives": 34, "train/num_positives": 22, - "train/positive_loss": 1.0307825803756714, - "train/total_loss": 0.8957207798957825 + "train/positive_loss": 0.5104425549507141, + "train/total_loss": 0.28694742918014526 + }, + { + "epoch": 8.098591549295774, + "step": 2300, + "train/classification_loss": 0.1651710867881775, + "train/contrastive_loss": 1.9835624694824219, + "train/negative_loss": 0.7725695371627808, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.2109929323196411, + "train/total_loss": 0.5618835687637329 + }, + { + "epoch": 8.098591549295774, + "step": 2300, + "train/classification_loss": 0.2049207091331482, + "train/contrastive_loss": 2.5237317085266113, + "train/negative_loss": 0.8629840612411499, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.6607476472854614, + "train/total_loss": 0.7096670866012573 + }, + { + "epoch": 8.098591549295774, + "step": 2300, + "train/classification_loss": 0.18920323252677917, + "train/contrastive_loss": 1.006458044052124, + "train/negative_loss": 0.6816026568412781, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.32485535740852356, + "train/total_loss": 0.39049482345581055 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.15723386406898499, - "train/contrastive_loss": 0.3471164405345917, - "train/negative_loss": 0.21548664569854736, + "train/classification_loss": 0.11797206848859787, + "train/contrastive_loss": 0.553642213344574, + "train/negative_loss": 0.5504075884819031, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.1316297948360443, - "train/total_loss": 0.22665715217590332 + "train/num_positives": 16, + "train/positive_loss": 0.0032346013467758894, + "train/total_loss": 0.22870051860809326 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.17206035554409027, - "train/contrastive_loss": 3.089056968688965, - "train/negative_loss": 1.8076468706130981, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.2814102172851562, - "train/total_loss": 0.7898717522621155 + "train/classification_loss": 0.18942297995090485, + "train/contrastive_loss": 2.5242488384246826, + "train/negative_loss": 1.4783424139022827, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 1.0459064245224, + "train/total_loss": 0.6942727565765381 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.24277779459953308, - "train/contrastive_loss": 3.222731590270996, - "train/negative_loss": 1.3183119297027588, + "train/classification_loss": 0.2820577621459961, + "train/contrastive_loss": 2.3094828128814697, + "train/negative_loss": 2.0089049339294434, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.9044196605682373, - "train/total_loss": 0.8873240947723389 + "train/num_positives": 2, + "train/positive_loss": 0.30057796835899353, + "train/total_loss": 0.7439543008804321 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.20272696018218994, - "train/contrastive_loss": 2.3288824558258057, - "train/negative_loss": 1.1671216487884521, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.1617608070373535, - "train/total_loss": 0.66850346326828 + "train/classification_loss": 0.13928921520709991, + "train/contrastive_loss": 2.8141512870788574, + "train/negative_loss": 1.2586567401885986, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.5554946660995483, + "train/total_loss": 0.7021194696426392 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.1784418374300003, - "train/contrastive_loss": 2.877772569656372, - "train/negative_loss": 2.432982921600342, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.44478967785835266, - "train/total_loss": 0.7539963722229004 + "train/classification_loss": 0.17805629968643188, + "train/contrastive_loss": 1.3132739067077637, + "train/negative_loss": 0.9032646417617798, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.4100092053413391, + "train/total_loss": 0.4407110810279846 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.2190650999546051, - "train/contrastive_loss": 3.607996702194214, - "train/negative_loss": 1.8978155851364136, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.7101811170578003, - "train/total_loss": 0.9406644105911255 + "train/classification_loss": 0.1912367194890976, + "train/contrastive_loss": 2.892659902572632, + "train/negative_loss": 0.8198800683021545, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 2.072779893875122, + "train/total_loss": 0.7697687149047852 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.23115646839141846, - "train/contrastive_loss": 3.3550074100494385, - "train/negative_loss": 2.298611640930176, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.0563957691192627, - "train/total_loss": 0.9021579623222351 + "train/classification_loss": 0.1900109350681305, + "train/contrastive_loss": 6.243737697601318, + "train/negative_loss": 6.243734836578369, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 2.8491119792306563e-06, + "train/total_loss": 1.4387584924697876 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.26809728145599365, - "train/contrastive_loss": 2.789905548095703, - "train/negative_loss": 1.5918116569519043, + "train/classification_loss": 0.1916729211807251, + "train/contrastive_loss": 2.114192485809326, + "train/negative_loss": 0.4543111324310303, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.1980940103530884, - "train/total_loss": 0.8260784149169922 + "train/positive_loss": 1.6598812341690063, + "train/total_loss": 0.6145114302635193 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.18597695231437683, - "train/contrastive_loss": 1.0090585947036743, - "train/negative_loss": 1.0039710998535156, + "train/classification_loss": 0.23355406522750854, + "train/contrastive_loss": 3.058589458465576, + "train/negative_loss": 1.378065824508667, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.0050875055603682995, - "train/total_loss": 0.38778865337371826 + "train/num_positives": 8, + "train/positive_loss": 1.6805236339569092, + "train/total_loss": 0.8452719449996948 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.15177950263023376, - "train/contrastive_loss": 1.2076460123062134, - "train/negative_loss": 0.3711972236633301, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.8364487886428833, - "train/total_loss": 0.39330869913101196 + "train/classification_loss": 0.16609349846839905, + "train/contrastive_loss": 2.6771068572998047, + "train/negative_loss": 1.1652591228485107, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.511847734451294, + "train/total_loss": 0.7015148401260376 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.15515105426311493, - "train/contrastive_loss": 1.5366243124008179, - "train/negative_loss": 0.548648476600647, - "train/num_negatives": 46, + "train/classification_loss": 0.2662345767021179, + "train/contrastive_loss": 2.5414786338806152, + "train/negative_loss": 2.198185443878174, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.9879758358001709, - "train/total_loss": 0.46247589588165283 + "train/positive_loss": 0.34329307079315186, + "train/total_loss": 0.774530291557312 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.23389965295791626, - "train/contrastive_loss": 1.5958974361419678, - "train/negative_loss": 1.5958974361419678, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5530791282653809 - }, - { - "epoch": 8.745247148288973, - "eval_exact_match_accuracy": 0.2742857142857143, - "eval_hamming_loss": 0.06901960784313725, - "eval_loss": 0.5501063466072083, - "eval_macro_f1": 0.27354645675116246, - "eval_macro_precision": 0.5551888932712081, - "eval_macro_recall": 0.20422488526490196, - "eval_micro_f1": 0.5149606299212598, - "eval_micro_precision": 0.8363171355498721, - "eval_micro_recall": 0.3720136518771331, - "eval_runtime": 2.6317, - "eval_samples_per_second": 199.49, - "eval_steps_per_second": 25.079, + "train/classification_loss": 0.16836853325366974, + "train/contrastive_loss": 0.46617648005485535, + "train/negative_loss": 0.4631706476211548, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.0030058410484343767, + "train/total_loss": 0.26160383224487305 + }, + { + "epoch": 8.098591549295774, + "eval_exact_match_accuracy": 0.2821869488536155, + "eval_hamming_loss": 0.07116920842411038, + "eval_loss": 0.5833853483200073, + "eval_macro_f1": 0.3069332640464957, + "eval_macro_precision": 0.48224143083602977, + "eval_macro_recall": 0.2493488712169924, + "eval_micro_f1": 0.5134751773049645, + "eval_micro_precision": 0.7669491525423728, + "eval_micro_recall": 0.3859275053304904, + "eval_runtime": 2.845, + "eval_samples_per_second": 199.297, + "eval_steps_per_second": 24.956, "step": 2300 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.22690388560295105, - "train/contrastive_loss": 1.4364670515060425, - "train/negative_loss": 0.6752392649650574, - "train/num_negatives": 36, - "train/num_positives": 10, - "train/positive_loss": 0.7612277865409851, - "train/total_loss": 0.5141972899436951 + "train/classification_loss": 0.10601180046796799, + "train/contrastive_loss": 0.4751158058643341, + "train/negative_loss": 0.4748990535736084, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.00021674255549442023, + "train/total_loss": 0.20103496313095093 }, { - "epoch": 8.745247148288973, + "epoch": 8.098591549295774, "step": 2300, - "train/classification_loss": 0.2159840315580368, - "train/contrastive_loss": 0.920192301273346, - "train/negative_loss": 0.5905598402023315, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.3296324610710144, - "train/total_loss": 0.4000225067138672 + "train/classification_loss": 0.17395861446857452, + "train/contrastive_loss": 0.9130652546882629, + "train/negative_loss": 0.4688066840171814, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.44425857067108154, + "train/total_loss": 0.35657167434692383 }, { - "epoch": 8.935361216730039, - "grad_norm": 9.3977689743042, - "learning_rate": 1.965799086757991e-05, - "loss": 0.7337, + "epoch": 8.274647887323944, + "grad_norm": 18.140853881835938, + "learning_rate": 1.968343904157858e-05, + "loss": 0.7399, "step": 2350 }, { - "epoch": 8.935361216730039, + "epoch": 8.274647887323944, "step": 2350, - "train/classification_loss": 0.132734015583992, - "train/contrastive_loss": 0.5070638060569763, - "train/negative_loss": 0.32200008630752563, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.18506371974945068, - "train/total_loss": 0.23414677381515503 + "train/classification_loss": 0.14559383690357208, + "train/contrastive_loss": 1.428407073020935, + "train/negative_loss": 0.6315807104110718, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.7968263626098633, + "train/total_loss": 0.43127524852752686 }, { - "epoch": 8.935361216730039, + "epoch": 8.274647887323944, "step": 2350, - "train/classification_loss": 0.1986212432384491, - "train/contrastive_loss": 0.5779910683631897, - "train/negative_loss": 0.5601039528846741, - "train/num_negatives": 44, + "train/classification_loss": 0.23761597275733948, + "train/contrastive_loss": 0.7272334694862366, + "train/negative_loss": 0.7253899574279785, + "train/num_negatives": 52, "train/num_positives": 4, - "train/positive_loss": 0.017887098714709282, - "train/total_loss": 0.31421947479248047 + "train/positive_loss": 0.0018435402307659388, + "train/total_loss": 0.3830626606941223 }, { - "epoch": 9.125475285171103, - "grad_norm": 11.41215705871582, - "learning_rate": 1.9650380517503808e-05, - "loss": 0.6664, + "epoch": 8.450704225352112, + "grad_norm": 13.615300178527832, + "learning_rate": 1.9676391825229034e-05, + "loss": 0.7359, "step": 2400 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.2511802017688751, - "train/contrastive_loss": 2.170243263244629, - "train/negative_loss": 0.9737837910652161, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.1964595317840576, - "train/total_loss": 0.6852288246154785 + "train/classification_loss": 0.2449459731578827, + "train/contrastive_loss": 2.094484567642212, + "train/negative_loss": 1.164997935295105, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.9294866323471069, + "train/total_loss": 0.6638429164886475 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.20259812474250793, - "train/contrastive_loss": 2.0097484588623047, - "train/negative_loss": 0.9516550302505493, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 1.058093547821045, - "train/total_loss": 0.6045478582382202 + "train/classification_loss": 0.2569793164730072, + "train/contrastive_loss": 1.2955036163330078, + "train/negative_loss": 0.8844051361083984, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.4110984206199646, + "train/total_loss": 0.5160800218582153 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.16038626432418823, - "train/contrastive_loss": 1.0297057628631592, - "train/negative_loss": 0.15766233205795288, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.8720433712005615, - "train/total_loss": 0.3663274049758911 + "train/classification_loss": 0.2583286762237549, + "train/contrastive_loss": 2.991950035095215, + "train/negative_loss": 1.8696959018707275, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.1222542524337769, + "train/total_loss": 0.8567187190055847 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.2000766396522522, - "train/contrastive_loss": 2.511446475982666, - "train/negative_loss": 1.6633141040802002, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.8481324315071106, - "train/total_loss": 0.7023659348487854 + "train/classification_loss": 0.14321866631507874, + "train/contrastive_loss": 1.5693767070770264, + "train/negative_loss": 1.141835331916809, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.4275414049625397, + "train/total_loss": 0.4570940136909485 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.12047658115625381, - "train/contrastive_loss": 2.154038190841675, - "train/negative_loss": 2.0316579341888428, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.12238036841154099, - "train/total_loss": 0.5512842535972595 + "train/classification_loss": 0.20901921391487122, + "train/contrastive_loss": 2.5436007976531982, + "train/negative_loss": 2.3255441188812256, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.21805673837661743, + "train/total_loss": 0.7177393436431885 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.1678415834903717, - "train/contrastive_loss": 1.9030072689056396, - "train/negative_loss": 1.4386132955551147, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.4643939733505249, - "train/total_loss": 0.548443078994751 + "train/classification_loss": 0.20494309067726135, + "train/contrastive_loss": 2.2672677040100098, + "train/negative_loss": 1.3010964393615723, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.966171383857727, + "train/total_loss": 0.6583966016769409 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.19565823674201965, - "train/contrastive_loss": 1.1001040935516357, - "train/negative_loss": 0.8346403241157532, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.2654637098312378, - "train/total_loss": 0.41567903757095337 + "train/classification_loss": 0.18722404539585114, + "train/contrastive_loss": 1.4128552675247192, + "train/negative_loss": 0.8419068455696106, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.5709484219551086, + "train/total_loss": 0.4697951078414917 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.1592833399772644, - "train/contrastive_loss": 1.6189165115356445, - "train/negative_loss": 1.1262015104293823, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.4927150309085846, - "train/total_loss": 0.4830666482448578 + "train/classification_loss": 0.1948729008436203, + "train/contrastive_loss": 1.3329535722732544, + "train/negative_loss": 1.3328713178634644, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 8.225779311032966e-05, + "train/total_loss": 0.4614636301994324 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.13626140356063843, - "train/contrastive_loss": 0.6616687774658203, - "train/negative_loss": 0.619294285774231, + "train/classification_loss": 0.10457542538642883, + "train/contrastive_loss": 0.5528663396835327, + "train/negative_loss": 0.35733428597450256, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.04237447306513786, - "train/total_loss": 0.2685951590538025 + "train/positive_loss": 0.19553205370903015, + "train/total_loss": 0.2151486873626709 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.32168328762054443, - "train/contrastive_loss": 3.5373449325561523, - "train/negative_loss": 1.4782453775405884, + "train/classification_loss": 0.168312206864357, + "train/contrastive_loss": 1.2611491680145264, + "train/negative_loss": 0.9446191191673279, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 2.0590994358062744, - "train/total_loss": 1.029152274131775 + "train/num_positives": 14, + "train/positive_loss": 0.3165300786495209, + "train/total_loss": 0.42054206132888794 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.1919061690568924, - "train/contrastive_loss": 2.037508964538574, - "train/negative_loss": 1.5070658922195435, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.5304429531097412, - "train/total_loss": 0.599407970905304 + "train/classification_loss": 0.15372414886951447, + "train/contrastive_loss": 1.440199613571167, + "train/negative_loss": 0.7387551665306091, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.7014443874359131, + "train/total_loss": 0.44176405668258667 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.12206913530826569, - "train/contrastive_loss": 1.349036693572998, - "train/negative_loss": 0.6220868229866028, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.7269498109817505, - "train/total_loss": 0.3918764591217041 + "train/classification_loss": 0.17469422519207, + "train/contrastive_loss": 2.0290565490722656, + "train/negative_loss": 2.0175931453704834, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.011463319882750511, + "train/total_loss": 0.5805055499076843 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.18481220304965973, - "train/contrastive_loss": 3.8380415439605713, - "train/negative_loss": 2.4277877807617188, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.4102537631988525, - "train/total_loss": 0.9524205327033997 + "train/classification_loss": 0.20461958646774292, + "train/contrastive_loss": 3.3113276958465576, + "train/negative_loss": 1.6892004013061523, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.6221272945404053, + "train/total_loss": 0.8668851256370544 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.1186649352312088, - "train/contrastive_loss": 1.0392698049545288, - "train/negative_loss": 1.0391851663589478, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 8.464067650493234e-05, - "train/total_loss": 0.3265188932418823 + "train/classification_loss": 0.16668808460235596, + "train/contrastive_loss": 1.0202604532241821, + "train/negative_loss": 0.8316395878791809, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.18862083554267883, + "train/total_loss": 0.3707401752471924 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.12986059486865997, - "train/contrastive_loss": 1.8427261114120483, - "train/negative_loss": 1.5478070974349976, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.2949190139770508, - "train/total_loss": 0.4984058141708374 + "train/classification_loss": 0.1361311972141266, + "train/contrastive_loss": 2.1061978340148926, + "train/negative_loss": 0.8262069225311279, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.2799909114837646, + "train/total_loss": 0.5573707818984985 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.13706527650356293, - "train/contrastive_loss": 0.663161039352417, - "train/negative_loss": 0.5512534379959106, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.11190757900476456, - "train/total_loss": 0.26969748735427856 + "train/classification_loss": 0.15822388231754303, + "train/contrastive_loss": 1.2653664350509644, + "train/negative_loss": 0.40365445613861084, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.8617119789123535, + "train/total_loss": 0.4112972021102905 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.2519212067127228, - "train/contrastive_loss": 2.9849891662597656, - "train/negative_loss": 1.5495078563690186, - "train/num_negatives": 40, + "train/classification_loss": 0.1280098557472229, + "train/contrastive_loss": 1.095563530921936, + "train/negative_loss": 0.45390164852142334, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 1.4354811906814575, - "train/total_loss": 0.8489190340042114 + "train/positive_loss": 0.6416618824005127, + "train/total_loss": 0.34712255001068115 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.1596565544605255, - "train/contrastive_loss": 1.026837706565857, - "train/negative_loss": 0.1485150158405304, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.8783226609230042, - "train/total_loss": 0.3650240898132324 + "train/classification_loss": 0.18794164061546326, + "train/contrastive_loss": 0.4926373064517975, + "train/negative_loss": 0.2894083559513092, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.20322895050048828, + "train/total_loss": 0.28646910190582275 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.18130117654800415, - "train/contrastive_loss": 1.3602657318115234, - "train/negative_loss": 1.357795238494873, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.0024704409297555685, - "train/total_loss": 0.4533543288707733 + "train/classification_loss": 0.14979209005832672, + "train/contrastive_loss": 0.8436325192451477, + "train/negative_loss": 0.5042153000831604, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.3394172191619873, + "train/total_loss": 0.31851857900619507 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.1669357568025589, - "train/contrastive_loss": 3.198763847351074, - "train/negative_loss": 1.6959469318389893, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.502816915512085, - "train/total_loss": 0.8066885471343994 + "train/classification_loss": 0.19912217557430267, + "train/contrastive_loss": 2.5443177223205566, + "train/negative_loss": 1.503640055656433, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.040677547454834, + "train/total_loss": 0.7079857587814331 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.23881854116916656, - "train/contrastive_loss": 1.9382538795471191, - "train/negative_loss": 0.4318777918815613, - "train/num_negatives": 44, + "train/classification_loss": 0.16029615700244904, + "train/contrastive_loss": 2.637667655944824, + "train/negative_loss": 2.5243072509765625, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.5063761472702026, - "train/total_loss": 0.6264693140983582 + "train/positive_loss": 0.11336030811071396, + "train/total_loss": 0.6878296732902527 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.2520308792591095, - "train/contrastive_loss": 1.726111888885498, - "train/negative_loss": 1.128849744796753, - "train/num_negatives": 44, + "train/classification_loss": 0.12428630143404007, + "train/contrastive_loss": 2.6403861045837402, + "train/negative_loss": 2.0968854427337646, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.5972621440887451, - "train/total_loss": 0.5972532629966736 + "train/positive_loss": 0.5435007214546204, + "train/total_loss": 0.6523635387420654 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.13531456887722015, - "train/contrastive_loss": 1.2159593105316162, - "train/negative_loss": 0.2780739665031433, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.9378854036331177, - "train/total_loss": 0.3785064220428467 + "train/classification_loss": 0.16106870770454407, + "train/contrastive_loss": 3.2484290599823, + "train/negative_loss": 1.6945791244506836, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 1.5538499355316162, + "train/total_loss": 0.8107545375823975 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.1285882592201233, - "train/contrastive_loss": 0.1665187031030655, - "train/negative_loss": 0.16572539508342743, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.0007933135493658483, - "train/total_loss": 0.16189199686050415 + "train/classification_loss": 0.2549956738948822, + "train/contrastive_loss": 3.269454002380371, + "train/negative_loss": 1.4515544176101685, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.8178997039794922, + "train/total_loss": 0.9088864326477051 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.09618305414915085, - "train/contrastive_loss": 0.7044481635093689, - "train/negative_loss": 0.6745692491531372, + "train/classification_loss": 0.18278349936008453, + "train/contrastive_loss": 2.224982976913452, + "train/negative_loss": 0.7934094667434692, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.029878908768296242, - "train/total_loss": 0.2370726764202118 + "train/num_positives": 10, + "train/positive_loss": 1.431573510169983, + "train/total_loss": 0.6277800798416138 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.2676226496696472, - "train/contrastive_loss": 2.0320072174072266, - "train/negative_loss": 0.3073628842830658, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.724644422531128, - "train/total_loss": 0.6740241050720215 + "train/classification_loss": 0.2195686250925064, + "train/contrastive_loss": 3.277425527572632, + "train/negative_loss": 2.4933409690856934, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.7840845584869385, + "train/total_loss": 0.8750537037849426 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.2831410765647888, - "train/contrastive_loss": 3.1870317459106445, - "train/negative_loss": 1.343204140663147, + "train/classification_loss": 0.19263122975826263, + "train/contrastive_loss": 1.8158292770385742, + "train/negative_loss": 1.8146997690200806, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.843827486038208, - "train/total_loss": 0.9205474257469177 + "train/num_positives": 4, + "train/positive_loss": 0.0011294549331068993, + "train/total_loss": 0.5557971000671387 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.1696857362985611, - "train/contrastive_loss": 2.4789047241210938, - "train/negative_loss": 2.2164525985717773, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.26245200634002686, - "train/total_loss": 0.6654666662216187 + "train/classification_loss": 0.16757798194885254, + "train/contrastive_loss": 0.24850153923034668, + "train/negative_loss": 0.22848138213157654, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.02002016268670559, + "train/total_loss": 0.21727828681468964 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.19147087633609772, - "train/contrastive_loss": 0.9116272926330566, - "train/negative_loss": 0.7156822085380554, - "train/num_negatives": 40, + "train/classification_loss": 0.2757203280925751, + "train/contrastive_loss": 2.6667003631591797, + "train/negative_loss": 1.565339207649231, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.19594505429267883, - "train/total_loss": 0.37379634380340576 - }, - { - "epoch": 9.125475285171103, - "step": 2400, - "train/classification_loss": 0.21057751774787903, - "train/contrastive_loss": 1.115084171295166, - "train/negative_loss": 0.33964794874191284, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.7754362225532532, - "train/total_loss": 0.43359434604644775 - }, - { - "epoch": 9.125475285171103, - "step": 2400, - "train/classification_loss": 0.14854823052883148, - "train/contrastive_loss": 2.4648561477661133, - "train/negative_loss": 1.4634236097335815, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 1.0014326572418213, - "train/total_loss": 0.6415194869041443 + "train/positive_loss": 1.1013610363006592, + "train/total_loss": 0.8090604543685913 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.2248719036579132, - "train/contrastive_loss": 3.0298264026641846, - "train/negative_loss": 1.4284781217575073, + "train/classification_loss": 0.19449162483215332, + "train/contrastive_loss": 0.5649770498275757, + "train/negative_loss": 0.5641927123069763, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.6013482809066772, - "train/total_loss": 0.8308372497558594 - }, - { - "epoch": 9.125475285171103, - "step": 2400, - "train/classification_loss": 0.25868499279022217, - "train/contrastive_loss": 1.3779834508895874, - "train/negative_loss": 1.3774032592773438, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0005802406813018024, - "train/total_loss": 0.5342817306518555 + "train/num_positives": 10, + "train/positive_loss": 0.0007843284984119236, + "train/total_loss": 0.30748704075813293 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.19850857555866241, - "train/contrastive_loss": 2.0333380699157715, - "train/negative_loss": 1.0055327415466309, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 1.0278053283691406, - "train/total_loss": 0.6051762104034424 + "train/classification_loss": 0.1655542105436325, + "train/contrastive_loss": 1.4574739933013916, + "train/negative_loss": 1.4567549228668213, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.0007190585602074862, + "train/total_loss": 0.45704901218414307 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.19816087186336517, - "train/contrastive_loss": 3.7254724502563477, - "train/negative_loss": 2.269536018371582, + "train/classification_loss": 0.16483651101589203, + "train/contrastive_loss": 2.407829761505127, + "train/negative_loss": 1.40552818775177, "train/num_negatives": 52, "train/num_positives": 4, - "train/positive_loss": 1.4559364318847656, - "train/total_loss": 0.9432553648948669 + "train/positive_loss": 1.0023016929626465, + "train/total_loss": 0.6464024782180786 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.17845529317855835, - "train/contrastive_loss": 3.416855812072754, - "train/negative_loss": 1.2954436540603638, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 2.1214120388031006, - "train/total_loss": 0.861826479434967 + "train/classification_loss": 0.17835907638072968, + "train/contrastive_loss": 2.0878913402557373, + "train/negative_loss": 1.2990790605545044, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.7888123393058777, + "train/total_loss": 0.5959373712539673 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.14055371284484863, - "train/contrastive_loss": 1.0178077220916748, - "train/negative_loss": 0.8930854797363281, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.12472224980592728, - "train/total_loss": 0.3441152572631836 + "train/classification_loss": 0.2198270857334137, + "train/contrastive_loss": 2.829572916030884, + "train/negative_loss": 1.9019861221313477, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.9275867938995361, + "train/total_loss": 0.7857416868209839 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.18516314029693604, - "train/contrastive_loss": 0.9443204402923584, - "train/negative_loss": 0.7982211112976074, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.14609935879707336, - "train/total_loss": 0.3740272521972656 + "train/classification_loss": 0.23555278778076172, + "train/contrastive_loss": 1.746448040008545, + "train/negative_loss": 1.2962474822998047, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.450200617313385, + "train/total_loss": 0.5848424434661865 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.20002441108226776, - "train/contrastive_loss": 1.5055738687515259, - "train/negative_loss": 1.3288601636886597, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.1767137050628662, - "train/total_loss": 0.5011391639709473 + "train/classification_loss": 0.1378675252199173, + "train/contrastive_loss": 1.980405569076538, + "train/negative_loss": 1.9791914224624634, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.0012141054030507803, + "train/total_loss": 0.5339486598968506 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.18809501826763153, - "train/contrastive_loss": 1.907532811164856, - "train/negative_loss": 1.8882229328155518, + "train/classification_loss": 0.20216575264930725, + "train/contrastive_loss": 1.2747738361358643, + "train/negative_loss": 0.6447005867958069, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.019309869036078453, - "train/total_loss": 0.5696015954017639 + "train/num_positives": 8, + "train/positive_loss": 0.6300731897354126, + "train/total_loss": 0.45712053775787354 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.16563040018081665, - "train/contrastive_loss": 0.8869033455848694, - "train/negative_loss": 0.8851439952850342, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.001759352977387607, - "train/total_loss": 0.3430110812187195 + "train/classification_loss": 0.23815526068210602, + "train/contrastive_loss": 3.062293291091919, + "train/negative_loss": 2.53509783744812, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.5271954536437988, + "train/total_loss": 0.8506138920783997 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.18106219172477722, - "train/contrastive_loss": 3.860193967819214, - "train/negative_loss": 3.442403554916382, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.41779035329818726, - "train/total_loss": 0.9531010389328003 + "train/classification_loss": 0.20140235126018524, + "train/contrastive_loss": 1.0562694072723389, + "train/negative_loss": 0.7323762774467468, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.32389307022094727, + "train/total_loss": 0.4126562476158142 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.1985945999622345, - "train/contrastive_loss": 1.2981218099594116, - "train/negative_loss": 0.6648949384689331, + "train/classification_loss": 0.2705965042114258, + "train/contrastive_loss": 3.890573024749756, + "train/negative_loss": 2.1461291313171387, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.6332268714904785, - "train/total_loss": 0.4582189619541168 + "train/num_positives": 8, + "train/positive_loss": 1.7444437742233276, + "train/total_loss": 1.0487110614776611 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.14659461379051208, - "train/contrastive_loss": 2.368844985961914, - "train/negative_loss": 1.2826223373413086, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.086222529411316, - "train/total_loss": 0.6203635931015015 + "train/classification_loss": 0.14587567746639252, + "train/contrastive_loss": 1.6785633563995361, + "train/negative_loss": 0.5967957377433777, + "train/num_negatives": 46, + "train/num_positives": 10, + "train/positive_loss": 1.0817675590515137, + "train/total_loss": 0.48158836364746094 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.13574792444705963, - "train/contrastive_loss": 1.7307813167572021, - "train/negative_loss": 0.9181351661682129, - "train/num_negatives": 40, + "train/classification_loss": 0.1672477424144745, + "train/contrastive_loss": 1.8323241472244263, + "train/negative_loss": 0.830080509185791, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.8126460909843445, - "train/total_loss": 0.48190420866012573 + "train/positive_loss": 1.0022436380386353, + "train/total_loss": 0.5337125658988953 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.27918124198913574, - "train/contrastive_loss": 1.8695586919784546, - "train/negative_loss": 1.3522905111312866, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.517268180847168, - "train/total_loss": 0.6530929803848267 + "train/classification_loss": 0.1621384620666504, + "train/contrastive_loss": 0.747734010219574, + "train/negative_loss": 0.747294008731842, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.0004400020989123732, + "train/total_loss": 0.3116852641105652 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.1154903918504715, - "train/contrastive_loss": 1.0403162240982056, - "train/negative_loss": 1.0403141975402832, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 2.0265601961000357e-06, - "train/total_loss": 0.3235536217689514 + "train/classification_loss": 0.24401827156543732, + "train/contrastive_loss": 1.2871679067611694, + "train/negative_loss": 1.1827905178070068, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.104377381503582, + "train/total_loss": 0.501451849937439 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.1557725965976715, - "train/contrastive_loss": 1.112598180770874, - "train/negative_loss": 0.7559860944747925, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.35661202669143677, - "train/total_loss": 0.3782922327518463 + "train/classification_loss": 0.16784295439720154, + "train/contrastive_loss": 0.9098984003067017, + "train/negative_loss": 0.9028022885322571, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.007096088957041502, + "train/total_loss": 0.34982264041900635 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.09190518409013748, - "train/contrastive_loss": 0.41600051522254944, - "train/negative_loss": 0.4149284064769745, + "train/classification_loss": 0.3237954378128052, + "train/contrastive_loss": 2.385223388671875, + "train/negative_loss": 1.2870439291000366, "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.0010721165454015136, - "train/total_loss": 0.1751052886247635 + "train/num_positives": 18, + "train/positive_loss": 1.098179578781128, + "train/total_loss": 0.8008401393890381 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.20577803254127502, - "train/contrastive_loss": 2.4352638721466064, - "train/negative_loss": 1.5413073301315308, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.8939565420150757, - "train/total_loss": 0.6928308010101318 + "train/classification_loss": 0.14544318616390228, + "train/contrastive_loss": 2.0616774559020996, + "train/negative_loss": 1.0446054935455322, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.0170719623565674, + "train/total_loss": 0.5577786564826965 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.1491461992263794, - "train/contrastive_loss": 1.723217487335205, - "train/negative_loss": 0.7167017459869385, + "train/classification_loss": 0.17914167046546936, + "train/contrastive_loss": 2.7266931533813477, + "train/negative_loss": 2.359682083129883, "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 1.0065157413482666, - "train/total_loss": 0.4937897026538849 + "train/positive_loss": 0.3670111894607544, + "train/total_loss": 0.7244802713394165 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.14637495577335358, - "train/contrastive_loss": 0.3010910749435425, - "train/negative_loss": 0.30095118284225464, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.00013989706349093467, - "train/total_loss": 0.20659317076206207 + "train/classification_loss": 0.2335483431816101, + "train/contrastive_loss": 2.696150302886963, + "train/negative_loss": 2.69614839553833, + "train/num_negatives": 48, + "train/num_positives": 2, + "train/positive_loss": 1.7881409348774469e-06, + "train/total_loss": 0.7727783918380737 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.20592135190963745, - "train/contrastive_loss": 1.9103419780731201, - "train/negative_loss": 0.8357800245285034, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.0745619535446167, - "train/total_loss": 0.5879897475242615 + "train/classification_loss": 0.19012564420700073, + "train/contrastive_loss": 2.4143619537353516, + "train/negative_loss": 1.1258702278137207, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 1.2884916067123413, + "train/total_loss": 0.6729980707168579 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.21413733065128326, - "train/contrastive_loss": 2.173126220703125, - "train/negative_loss": 1.5421627759933472, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.6309635043144226, - "train/total_loss": 0.648762583732605 + "train/classification_loss": 0.12416550517082214, + "train/contrastive_loss": 0.2659369707107544, + "train/negative_loss": 0.1255723387002945, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.1403646171092987, + "train/total_loss": 0.1773529052734375 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.16674919426441193, - "train/contrastive_loss": 0.9810001850128174, - "train/negative_loss": 0.40045222640037537, + "train/classification_loss": 0.19429625570774078, + "train/contrastive_loss": 1.1504722833633423, + "train/negative_loss": 0.9434749484062195, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.5805479288101196, - "train/total_loss": 0.3629492521286011 + "train/num_positives": 8, + "train/positive_loss": 0.20699737966060638, + "train/total_loss": 0.4243907332420349 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.17181725800037384, - "train/contrastive_loss": 2.801069498062134, - "train/negative_loss": 2.1547772884368896, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.6462922096252441, - "train/total_loss": 0.7320311665534973 + "train/classification_loss": 0.2082436978816986, + "train/contrastive_loss": 1.014721155166626, + "train/negative_loss": 0.8957695364952087, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.11895164847373962, + "train/total_loss": 0.41118794679641724 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.23232883214950562, - "train/contrastive_loss": 2.972302198410034, - "train/negative_loss": 1.2202600240707397, - "train/num_negatives": 46, + "train/classification_loss": 0.29638078808784485, + "train/contrastive_loss": 2.539285659790039, + "train/negative_loss": 1.3751596212387085, + "train/num_negatives": 36, "train/num_positives": 6, - "train/positive_loss": 1.7520421743392944, - "train/total_loss": 0.8267892599105835 + "train/positive_loss": 1.1641261577606201, + "train/total_loss": 0.804237961769104 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.19885124266147614, - "train/contrastive_loss": 2.29836106300354, - "train/negative_loss": 1.806561827659607, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.4917992353439331, - "train/total_loss": 0.658523440361023 + "train/classification_loss": 0.144293412566185, + "train/contrastive_loss": 1.1578879356384277, + "train/negative_loss": 0.2715948224067688, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.8862931728363037, + "train/total_loss": 0.3758710026741028 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.18180318176746368, - "train/contrastive_loss": 2.773526191711426, - "train/negative_loss": 2.2326180934906006, + "train/classification_loss": 0.1365317702293396, + "train/contrastive_loss": 0.9785356521606445, + "train/negative_loss": 0.26192107796669006, "train/num_negatives": 34, "train/num_positives": 22, - "train/positive_loss": 0.5409079790115356, - "train/total_loss": 0.7365084290504456 + "train/positive_loss": 0.7166145443916321, + "train/total_loss": 0.33223891258239746 + }, + { + "epoch": 8.450704225352112, + "step": 2400, + "train/classification_loss": 0.18250741064548492, + "train/contrastive_loss": 2.235269069671631, + "train/negative_loss": 1.0084832906723022, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.226785659790039, + "train/total_loss": 0.6295612454414368 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.22875982522964478, - "train/contrastive_loss": 3.6835312843322754, - "train/negative_loss": 1.9154335260391235, + "train/classification_loss": 0.19683633744716644, + "train/contrastive_loss": 2.222316265106201, + "train/negative_loss": 1.7189472913742065, "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.5033690333366394, + "train/total_loss": 0.6412996053695679 + }, + { + "epoch": 8.450704225352112, + "step": 2400, + "train/classification_loss": 0.19557024538516998, + "train/contrastive_loss": 0.8996196985244751, + "train/negative_loss": 0.5515589118003845, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.34806081652641296, + "train/total_loss": 0.37549418210983276 + }, + { + "epoch": 8.450704225352112, + "step": 2400, + "train/classification_loss": 0.11459163576364517, + "train/contrastive_loss": 0.2867501974105835, + "train/negative_loss": 0.2779722213745117, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.008777974173426628, + "train/total_loss": 0.17194166779518127 + }, + { + "epoch": 8.450704225352112, + "step": 2400, + "train/classification_loss": 0.18750149011611938, + "train/contrastive_loss": 2.071375608444214, + "train/negative_loss": 1.2362457513809204, + "train/num_negatives": 40, "train/num_positives": 10, - "train/positive_loss": 1.7680977582931519, - "train/total_loss": 0.9654660820960999 + "train/positive_loss": 0.8351298570632935, + "train/total_loss": 0.6017765998840332 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.22568556666374207, - "train/contrastive_loss": 4.7214035987854, - "train/negative_loss": 3.56019926071167, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.1612043380737305, - "train/total_loss": 1.1699663400650024 + "train/classification_loss": 0.2722088396549225, + "train/contrastive_loss": 3.3038153648376465, + "train/negative_loss": 1.9966479539871216, + "train/num_negatives": 46, + "train/num_positives": 2, + "train/positive_loss": 1.3071672916412354, + "train/total_loss": 0.9329719543457031 + }, + { + "epoch": 8.450704225352112, + "step": 2400, + "train/classification_loss": 0.13532032072544098, + "train/contrastive_loss": 2.162440299987793, + "train/negative_loss": 1.180728554725647, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.9817118048667908, + "train/total_loss": 0.5678083896636963 + }, + { + "epoch": 8.450704225352112, + "step": 2400, + "train/classification_loss": 0.18387490510940552, + "train/contrastive_loss": 1.4897825717926025, + "train/negative_loss": 0.8728315234184265, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.6169509887695312, + "train/total_loss": 0.481831431388855 + }, + { + "epoch": 8.450704225352112, + "step": 2400, + "train/classification_loss": 0.1634780913591385, + "train/contrastive_loss": 1.4458531141281128, + "train/negative_loss": 0.5584594011306763, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 0.8873937129974365, + "train/total_loss": 0.45264869928359985 + }, + { + "epoch": 8.450704225352112, + "step": 2400, + "train/classification_loss": 0.1681169867515564, + "train/contrastive_loss": 4.320793151855469, + "train/negative_loss": 4.320789813995361, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 3.218665369786322e-06, + "train/total_loss": 1.032275676727295 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.2741857171058655, - "train/contrastive_loss": 3.182663917541504, - "train/negative_loss": 1.7614647150039673, + "train/classification_loss": 0.17943213880062103, + "train/contrastive_loss": 1.8562180995941162, + "train/negative_loss": 0.84536212682724, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.421199083328247, - "train/total_loss": 0.9107185006141663 + "train/positive_loss": 1.010856032371521, + "train/total_loss": 0.5506757497787476 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.18686138093471527, - "train/contrastive_loss": 0.8023602962493896, - "train/negative_loss": 0.7612498998641968, + "train/classification_loss": 0.20423956215381622, + "train/contrastive_loss": 2.25396728515625, + "train/negative_loss": 1.5905145406723022, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.04111039265990257, - "train/total_loss": 0.3473334312438965 + "train/num_positives": 8, + "train/positive_loss": 0.6634528040885925, + "train/total_loss": 0.6550330519676208 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.15292412042617798, - "train/contrastive_loss": 1.3372981548309326, - "train/negative_loss": 0.6603885293006897, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.6769095659255981, - "train/total_loss": 0.4203837513923645 + "train/classification_loss": 0.1618092656135559, + "train/contrastive_loss": 2.6421542167663574, + "train/negative_loss": 0.9217068552970886, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.7204474210739136, + "train/total_loss": 0.6902401447296143 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.1403968781232834, - "train/contrastive_loss": 1.2715907096862793, - "train/negative_loss": 0.40703535079956055, - "train/num_negatives": 46, + "train/classification_loss": 0.25699126720428467, + "train/contrastive_loss": 1.65337336063385, + "train/negative_loss": 1.4641841650009155, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.864555299282074, - "train/total_loss": 0.39471501111984253 + "train/positive_loss": 0.18918918073177338, + "train/total_loss": 0.5876659154891968 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.22068142890930176, - "train/contrastive_loss": 1.5100187063217163, - "train/negative_loss": 1.5100187063217163, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.522685170173645 - }, - { - "epoch": 9.125475285171103, - "eval_exact_match_accuracy": 0.29333333333333333, - "eval_hamming_loss": 0.06767507002801121, - "eval_loss": 0.5685345530509949, - "eval_macro_f1": 0.2804456257177737, - "eval_macro_precision": 0.460310479181116, - "eval_macro_recall": 0.2232895912558417, - "eval_micro_f1": 0.5492537313432836, - "eval_micro_precision": 0.7982646420824295, - "eval_micro_recall": 0.41865756541524457, - "eval_runtime": 2.6311, - "eval_samples_per_second": 199.534, - "eval_steps_per_second": 25.084, + "train/classification_loss": 0.16687235236167908, + "train/contrastive_loss": 0.5587081909179688, + "train/negative_loss": 0.48641812801361084, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.07229007035493851, + "train/total_loss": 0.27861398458480835 + }, + { + "epoch": 8.450704225352112, + "eval_exact_match_accuracy": 0.2874779541446208, + "eval_hamming_loss": 0.0682643427741467, + "eval_loss": 0.5643488168716431, + "eval_macro_f1": 0.3535031028397779, + "eval_macro_precision": 0.5754891656934286, + "eval_macro_recall": 0.2853629307270238, + "eval_micro_f1": 0.5320056899004267, + "eval_micro_precision": 0.7991452991452992, + "eval_micro_recall": 0.39872068230277186, + "eval_runtime": 2.8456, + "eval_samples_per_second": 199.255, + "eval_steps_per_second": 24.951, "step": 2400 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.15201476216316223, - "train/contrastive_loss": 1.6372392177581787, - "train/negative_loss": 0.6625121831893921, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.9747270941734314, - "train/total_loss": 0.4794626235961914 + "train/classification_loss": 0.14886359870433807, + "train/contrastive_loss": 0.9310144782066345, + "train/negative_loss": 0.8535827994346619, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.07743166387081146, + "train/total_loss": 0.3350664973258972 }, { - "epoch": 9.125475285171103, + "epoch": 8.450704225352112, "step": 2400, - "train/classification_loss": 0.1453404277563095, - "train/contrastive_loss": 0.32519280910491943, - "train/negative_loss": 0.25213736295700073, - "train/num_negatives": 36, - "train/num_positives": 20, - "train/positive_loss": 0.0730554386973381, - "train/total_loss": 0.2103789895772934 + "train/classification_loss": 0.13936017453670502, + "train/contrastive_loss": 0.7120563983917236, + "train/negative_loss": 0.6321664452552795, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.0798899307847023, + "train/total_loss": 0.2817714512348175 }, { - "epoch": 9.315589353612168, - "grad_norm": 5.369113445281982, - "learning_rate": 1.9642770167427703e-05, - "loss": 0.6142, + "epoch": 8.626760563380282, + "grad_norm": 18.51525115966797, + "learning_rate": 1.9669344608879495e-05, + "loss": 0.7023, "step": 2450 }, { - "epoch": 9.315589353612168, + "epoch": 8.626760563380282, "step": 2450, - "train/classification_loss": 0.13813649117946625, - "train/contrastive_loss": 1.0321993827819824, - "train/negative_loss": 1.0290164947509766, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.0031829304061830044, - "train/total_loss": 0.344576358795166 + "train/classification_loss": 0.11917033046483994, + "train/contrastive_loss": 0.31866520643234253, + "train/negative_loss": 0.22773566842079163, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.0909295380115509, + "train/total_loss": 0.18290337920188904 }, { - "epoch": 9.315589353612168, + "epoch": 8.626760563380282, "step": 2450, - "train/classification_loss": 0.18372885882854462, - "train/contrastive_loss": 2.2121951580047607, - "train/negative_loss": 0.7466533780097961, - "train/num_negatives": 36, - "train/num_positives": 8, - "train/positive_loss": 1.4655418395996094, - "train/total_loss": 0.626167893409729 + "train/classification_loss": 0.13346493244171143, + "train/contrastive_loss": 0.7950259447097778, + "train/negative_loss": 0.5877374410629272, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.20728850364685059, + "train/total_loss": 0.29247012734413147 }, { - "epoch": 9.505703422053232, - "grad_norm": 5.927659034729004, - "learning_rate": 1.9635159817351597e-05, - "loss": 0.6507, + "epoch": 8.80281690140845, + "grad_norm": 10.050371170043945, + "learning_rate": 1.9662297392529953e-05, + "loss": 0.6547, "step": 2500 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.2708266079425812, - "train/contrastive_loss": 2.025637626647949, - "train/negative_loss": 0.5830605626106262, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.4425770044326782, - "train/total_loss": 0.6759541034698486 + "train/classification_loss": 0.2511644661426544, + "train/contrastive_loss": 2.6396262645721436, + "train/negative_loss": 1.6967718601226807, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.9428543448448181, + "train/total_loss": 0.7790896892547607 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.18441766500473022, - "train/contrastive_loss": 1.93165922164917, - "train/negative_loss": 1.0458091497421265, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.8858500123023987, - "train/total_loss": 0.5707495212554932 + "train/classification_loss": 0.24657103419303894, + "train/contrastive_loss": 0.7728821635246277, + "train/negative_loss": 0.6604555249214172, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.11242662370204926, + "train/total_loss": 0.4011474847793579 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.15823614597320557, - "train/contrastive_loss": 1.0672475099563599, - "train/negative_loss": 0.24568326771259308, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.821564257144928, - "train/total_loss": 0.371685653924942 + "train/classification_loss": 0.2421797811985016, + "train/contrastive_loss": 2.3896260261535645, + "train/negative_loss": 1.2844914197921753, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.1051344871520996, + "train/total_loss": 0.720104992389679 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.18432047963142395, - "train/contrastive_loss": 3.144784688949585, - "train/negative_loss": 1.6950488090515137, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.4497358798980713, - "train/total_loss": 0.8132774829864502 + "train/classification_loss": 0.14494135975837708, + "train/contrastive_loss": 1.591440200805664, + "train/negative_loss": 1.1758092641830444, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.41563090682029724, + "train/total_loss": 0.4632294178009033 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.10781760513782501, - "train/contrastive_loss": 0.7046509385108948, - "train/negative_loss": 0.6596760153770447, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.04497490078210831, - "train/total_loss": 0.2487477958202362 + "train/classification_loss": 0.21130205690860748, + "train/contrastive_loss": 2.506287097930908, + "train/negative_loss": 2.0280110836029053, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.47827598452568054, + "train/total_loss": 0.7125594615936279 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.17165273427963257, - "train/contrastive_loss": 2.0411291122436523, - "train/negative_loss": 1.4339168071746826, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.6072121858596802, - "train/total_loss": 0.579878568649292 + "train/classification_loss": 0.20617571473121643, + "train/contrastive_loss": 1.9634813070297241, + "train/negative_loss": 1.2506732940673828, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.7128080129623413, + "train/total_loss": 0.5988719463348389 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.20838482677936554, - "train/contrastive_loss": 1.2163511514663696, - "train/negative_loss": 0.9932559728622437, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.22309517860412598, - "train/total_loss": 0.4516550600528717 + "train/classification_loss": 0.1936262845993042, + "train/contrastive_loss": 2.0033059120178223, + "train/negative_loss": 0.8608787059783936, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.1424270868301392, + "train/total_loss": 0.5942875146865845 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.14467300474643707, - "train/contrastive_loss": 1.9120838642120361, - "train/negative_loss": 1.251225471496582, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.6608584523200989, - "train/total_loss": 0.5270897746086121 + "train/classification_loss": 0.19313490390777588, + "train/contrastive_loss": 0.7414778470993042, + "train/negative_loss": 0.7409564852714539, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 0.000521378533449024, + "train/total_loss": 0.3414304852485657 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.14423280954360962, - "train/contrastive_loss": 0.9086791276931763, - "train/negative_loss": 0.8987156748771667, + "train/classification_loss": 0.1011158898472786, + "train/contrastive_loss": 0.35006284713745117, + "train/negative_loss": 0.3396986424922943, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.009963436052203178, - "train/total_loss": 0.3259686231613159 + "train/positive_loss": 0.010364211164414883, + "train/total_loss": 0.17112845182418823 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.3425733745098114, - "train/contrastive_loss": 4.3210320472717285, - "train/negative_loss": 2.002639055252075, + "train/classification_loss": 0.16592451930046082, + "train/contrastive_loss": 1.7435455322265625, + "train/negative_loss": 1.136543869972229, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 2.3183929920196533, - "train/total_loss": 1.2067798376083374 + "train/num_positives": 14, + "train/positive_loss": 0.6070016026496887, + "train/total_loss": 0.5146336555480957 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.1780475527048111, - "train/contrastive_loss": 1.737654447555542, - "train/negative_loss": 1.4227817058563232, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.31487274169921875, - "train/total_loss": 0.5255784392356873 + "train/classification_loss": 0.1462712585926056, + "train/contrastive_loss": 1.435616135597229, + "train/negative_loss": 0.5031639933586121, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.9324521422386169, + "train/total_loss": 0.43339449167251587 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.10146190226078033, - "train/contrastive_loss": 0.6343109607696533, - "train/negative_loss": 0.39664238691329956, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.23766855895519257, - "train/total_loss": 0.22832410037517548 + "train/classification_loss": 0.18088997900485992, + "train/contrastive_loss": 1.6934937238693237, + "train/negative_loss": 1.6808782815933228, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.012615488842129707, + "train/total_loss": 0.5195887088775635 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.1890408992767334, - "train/contrastive_loss": 3.6010823249816895, - "train/negative_loss": 2.3539376258850098, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.2471445798873901, - "train/total_loss": 0.9092573523521423 + "train/classification_loss": 0.19819100201129913, + "train/contrastive_loss": 3.67189359664917, + "train/negative_loss": 2.29703950881958, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.3748542070388794, + "train/total_loss": 0.9325697422027588 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.13105274736881256, - "train/contrastive_loss": 2.766765594482422, - "train/negative_loss": 2.7623748779296875, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.004390786401927471, - "train/total_loss": 0.6844058632850647 + "train/classification_loss": 0.1696241945028305, + "train/contrastive_loss": 1.2580044269561768, + "train/negative_loss": 0.9411847591400146, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.3168196976184845, + "train/total_loss": 0.42122507095336914 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.12080449610948563, - "train/contrastive_loss": 1.8581289052963257, - "train/negative_loss": 1.499510407447815, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.35861849784851074, - "train/total_loss": 0.49243026971817017 + "train/classification_loss": 0.13428957760334015, + "train/contrastive_loss": 2.469491958618164, + "train/negative_loss": 0.8042869567871094, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.6652050018310547, + "train/total_loss": 0.6281879544258118 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.13615049421787262, - "train/contrastive_loss": 0.39384138584136963, - "train/negative_loss": 0.37963250279426575, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.014208870008587837, - "train/total_loss": 0.21491876244544983 + "train/classification_loss": 0.15965595841407776, + "train/contrastive_loss": 1.5159543752670288, + "train/negative_loss": 0.6359073519706726, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.8800470232963562, + "train/total_loss": 0.4628468453884125 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.23152752220630646, - "train/contrastive_loss": 2.5743813514709473, - "train/negative_loss": 1.1982271671295166, - "train/num_negatives": 40, + "train/classification_loss": 0.12364625930786133, + "train/contrastive_loss": 0.8296409249305725, + "train/negative_loss": 0.30147844552993774, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 1.3761543035507202, - "train/total_loss": 0.7464038133621216 + "train/positive_loss": 0.5281624794006348, + "train/total_loss": 0.28957444429397583 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.17302736639976501, - "train/contrastive_loss": 0.917982816696167, - "train/negative_loss": 0.18898332118988037, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.7289994955062866, - "train/total_loss": 0.35662394762039185 + "train/classification_loss": 0.18789976835250854, + "train/contrastive_loss": 0.8999439477920532, + "train/negative_loss": 0.6030117869377136, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.2969321608543396, + "train/total_loss": 0.36788856983184814 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.1780686378479004, - "train/contrastive_loss": 0.9326674342155457, - "train/negative_loss": 0.9302377700805664, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.002429660176858306, - "train/total_loss": 0.36460214853286743 + "train/classification_loss": 0.15312260389328003, + "train/contrastive_loss": 0.9006112813949585, + "train/negative_loss": 0.4755997657775879, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.425011545419693, + "train/total_loss": 0.33324486017227173 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.16189274191856384, - "train/contrastive_loss": 2.1664180755615234, - "train/negative_loss": 1.4997414350509644, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.6666767001152039, - "train/total_loss": 0.5951763391494751 + "train/classification_loss": 0.206082284450531, + "train/contrastive_loss": 4.2448930740356445, + "train/negative_loss": 1.7870343923568726, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 2.4578585624694824, + "train/total_loss": 1.055060863494873 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.24343986809253693, - "train/contrastive_loss": 2.128925085067749, - "train/negative_loss": 0.4730595052242279, - "train/num_negatives": 44, + "train/classification_loss": 0.15332470834255219, + "train/contrastive_loss": 2.7012293338775635, + "train/negative_loss": 2.311882972717285, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.6558656692504883, - "train/total_loss": 0.6692249178886414 + "train/positive_loss": 0.3893464505672455, + "train/total_loss": 0.693570613861084 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.22716014087200165, - "train/contrastive_loss": 1.757094383239746, - "train/negative_loss": 1.1711466312408447, - "train/num_negatives": 44, + "train/classification_loss": 0.1317104548215866, + "train/contrastive_loss": 2.714829921722412, + "train/negative_loss": 2.0845723152160645, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.5859478116035461, - "train/total_loss": 0.5785790085792542 + "train/positive_loss": 0.6302576065063477, + "train/total_loss": 0.6746764779090881 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.11749795079231262, - "train/contrastive_loss": 0.8795303702354431, - "train/negative_loss": 0.2468094825744629, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.6327208876609802, - "train/total_loss": 0.2934040427207947 + "train/classification_loss": 0.15104888379573822, + "train/contrastive_loss": 2.1891095638275146, + "train/negative_loss": 1.3497951030731201, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.8393144607543945, + "train/total_loss": 0.5888708233833313 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.1347874402999878, - "train/contrastive_loss": 0.1747724413871765, - "train/negative_loss": 0.09611876308917999, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.07865368574857712, - "train/total_loss": 0.1697419285774231 + "train/classification_loss": 0.26691919565200806, + "train/contrastive_loss": 3.4873218536376953, + "train/negative_loss": 1.592253565788269, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.8950684070587158, + "train/total_loss": 0.964383602142334 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.1027979850769043, - "train/contrastive_loss": 0.705227255821228, - "train/negative_loss": 0.6406439542770386, + "train/classification_loss": 0.17469654977321625, + "train/contrastive_loss": 2.040550947189331, + "train/negative_loss": 0.7673336863517761, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.06458333134651184, - "train/total_loss": 0.2438434362411499 + "train/num_positives": 10, + "train/positive_loss": 1.2732173204421997, + "train/total_loss": 0.5828067660331726 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.25482553243637085, - "train/contrastive_loss": 1.6842502355575562, - "train/negative_loss": 0.1609644591808319, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.5232857465744019, - "train/total_loss": 0.5916755795478821 + "train/classification_loss": 0.210176020860672, + "train/contrastive_loss": 1.7441418170928955, + "train/negative_loss": 1.0948737859725952, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.6492680311203003, + "train/total_loss": 0.5590044260025024 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.27704229950904846, - "train/contrastive_loss": 4.394126892089844, - "train/negative_loss": 1.6246694326400757, + "train/classification_loss": 0.19292020797729492, + "train/contrastive_loss": 1.745369791984558, + "train/negative_loss": 1.744639277458191, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 2.7694573402404785, - "train/total_loss": 1.1558676958084106 + "train/num_positives": 4, + "train/positive_loss": 0.0007304659811779857, + "train/total_loss": 0.5419942140579224 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.16650457680225372, - "train/contrastive_loss": 2.677478790283203, - "train/negative_loss": 2.154146432876587, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.5233322381973267, - "train/total_loss": 0.7020003199577332 + "train/classification_loss": 0.16902956366539001, + "train/contrastive_loss": 0.20009179413318634, + "train/negative_loss": 0.14015941321849823, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.05993238091468811, + "train/total_loss": 0.20904792845249176 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.2028675526380539, - "train/contrastive_loss": 0.5896481275558472, - "train/negative_loss": 0.48385339975357056, - "train/num_negatives": 40, + "train/classification_loss": 0.265617698431015, + "train/contrastive_loss": 2.663512945175171, + "train/negative_loss": 1.1290005445480347, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.1057947427034378, - "train/total_loss": 0.3207971751689911 - }, - { - "epoch": 9.505703422053232, - "step": 2500, - "train/classification_loss": 0.20297126471996307, - "train/contrastive_loss": 0.7293708324432373, - "train/negative_loss": 0.5632634162902832, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.1661073863506317, - "train/total_loss": 0.3488454222679138 + "train/positive_loss": 1.5345124006271362, + "train/total_loss": 0.7983202934265137 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.12884081900119781, - "train/contrastive_loss": 1.380623698234558, - "train/negative_loss": 0.6703004837036133, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.7103232145309448, - "train/total_loss": 0.4049655795097351 - }, - { - "epoch": 9.505703422053232, - "step": 2500, - "train/classification_loss": 0.23180840909481049, - "train/contrastive_loss": 3.5314230918884277, - "train/negative_loss": 2.0332067012786865, + "train/classification_loss": 0.18727409839630127, + "train/contrastive_loss": 0.918952465057373, + "train/negative_loss": 0.9178711771965027, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.4982163906097412, - "train/total_loss": 0.9380930662155151 - }, - { - "epoch": 9.505703422053232, - "step": 2500, - "train/classification_loss": 0.23055104911327362, - "train/contrastive_loss": 0.7857694029808044, - "train/negative_loss": 0.7854960560798645, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.000273324636509642, - "train/total_loss": 0.3877049386501312 + "train/num_positives": 10, + "train/positive_loss": 0.0010813073022291064, + "train/total_loss": 0.37106460332870483 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.20539627969264984, - "train/contrastive_loss": 1.6583597660064697, - "train/negative_loss": 0.873618483543396, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.7847412824630737, - "train/total_loss": 0.537068247795105 + "train/classification_loss": 0.16883639991283417, + "train/contrastive_loss": 1.177332878112793, + "train/negative_loss": 1.0624253749847412, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.11490747332572937, + "train/total_loss": 0.4043029844760895 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.20502538979053497, - "train/contrastive_loss": 4.71287727355957, - "train/negative_loss": 2.7724616527557373, + "train/classification_loss": 0.16628685593605042, + "train/contrastive_loss": 2.399775505065918, + "train/negative_loss": 1.6184954643249512, "train/num_negatives": 52, "train/num_positives": 4, - "train/positive_loss": 1.9404157400131226, - "train/total_loss": 1.1476008892059326 + "train/positive_loss": 0.7812799215316772, + "train/total_loss": 0.6462419629096985 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.1684514880180359, - "train/contrastive_loss": 3.7788357734680176, - "train/negative_loss": 1.5185967683792114, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 2.2602388858795166, - "train/total_loss": 0.9242186546325684 + "train/classification_loss": 0.17768938839435577, + "train/contrastive_loss": 1.727698802947998, + "train/negative_loss": 0.8660138845443726, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.8616849184036255, + "train/total_loss": 0.52322918176651 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.15273500978946686, - "train/contrastive_loss": 0.3167257010936737, - "train/negative_loss": 0.25415271520614624, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.06257299333810806, - "train/total_loss": 0.21608015894889832 + "train/classification_loss": 0.21600525081157684, + "train/contrastive_loss": 1.8556184768676758, + "train/negative_loss": 1.7665786743164062, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.08903981745243073, + "train/total_loss": 0.5871289372444153 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.17385460436344147, - "train/contrastive_loss": 0.7777055501937866, - "train/negative_loss": 0.7743061184883118, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.0033994214609265327, - "train/total_loss": 0.32939571142196655 + "train/classification_loss": 0.2321563959121704, + "train/contrastive_loss": 2.2539730072021484, + "train/negative_loss": 1.6598936319351196, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.5940792560577393, + "train/total_loss": 0.6829509735107422 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.20539601147174835, - "train/contrastive_loss": 2.07822847366333, - "train/negative_loss": 1.7511762380599976, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.3270522356033325, - "train/total_loss": 0.6210417151451111 + "train/classification_loss": 0.13460731506347656, + "train/contrastive_loss": 2.105048656463623, + "train/negative_loss": 2.1049978733062744, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 5.0864673539763317e-05, + "train/total_loss": 0.555617094039917 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.18470783531665802, - "train/contrastive_loss": 1.8673293590545654, - "train/negative_loss": 1.832430124282837, + "train/classification_loss": 0.1841176301240921, + "train/contrastive_loss": 0.8083468675613403, + "train/negative_loss": 0.3539351522922516, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.03489918261766434, - "train/total_loss": 0.5581737160682678 + "train/num_positives": 8, + "train/positive_loss": 0.45441168546676636, + "train/total_loss": 0.345786988735199 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.1684931516647339, - "train/contrastive_loss": 0.8547806143760681, - "train/negative_loss": 0.8105660676956177, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.04421452432870865, - "train/total_loss": 0.33944928646087646 + "train/classification_loss": 0.23715537786483765, + "train/contrastive_loss": 2.8935818672180176, + "train/negative_loss": 2.5387141704559326, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.35486775636672974, + "train/total_loss": 0.8158717751502991 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.17063768208026886, - "train/contrastive_loss": 2.4237563610076904, - "train/negative_loss": 1.9768431186676025, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.4469131529331207, - "train/total_loss": 0.6553889513015747 + "train/classification_loss": 0.20092280209064484, + "train/contrastive_loss": 0.7501943707466125, + "train/negative_loss": 0.5360543131828308, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.21414004266262054, + "train/total_loss": 0.35096168518066406 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.2035449892282486, - "train/contrastive_loss": 1.055041790008545, - "train/negative_loss": 0.5142273306846619, + "train/classification_loss": 0.27190569043159485, + "train/contrastive_loss": 2.9224958419799805, + "train/negative_loss": 2.2097790241241455, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.5408143997192383, - "train/total_loss": 0.41455334424972534 + "train/num_positives": 8, + "train/positive_loss": 0.712716817855835, + "train/total_loss": 0.8564049005508423 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.1509382724761963, - "train/contrastive_loss": 2.0535173416137695, - "train/negative_loss": 1.1723241806030273, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.881193220615387, - "train/total_loss": 0.5616417527198792 + "train/classification_loss": 0.1484273076057434, + "train/contrastive_loss": 1.7271867990493774, + "train/negative_loss": 0.7041757106781006, + "train/num_negatives": 46, + "train/num_positives": 10, + "train/positive_loss": 1.0230110883712769, + "train/total_loss": 0.49386468529701233 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.13419045507907867, - "train/contrastive_loss": 0.6789491176605225, - "train/negative_loss": 0.2856418788433075, - "train/num_negatives": 40, + "train/classification_loss": 0.17107242345809937, + "train/contrastive_loss": 2.5170531272888184, + "train/negative_loss": 1.2578942775726318, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.39330723881721497, - "train/total_loss": 0.2699802815914154 + "train/positive_loss": 1.2591588497161865, + "train/total_loss": 0.674483060836792 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.29521769285202026, - "train/contrastive_loss": 1.7423346042633057, - "train/negative_loss": 1.0307906866073608, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.7115439772605896, - "train/total_loss": 0.6436846256256104 + "train/classification_loss": 0.1631156951189041, + "train/contrastive_loss": 0.9078551530838013, + "train/negative_loss": 0.9074746966362, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.00038047906127758324, + "train/total_loss": 0.34468674659729004 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.1103091835975647, - "train/contrastive_loss": 0.9092165231704712, - "train/negative_loss": 0.9092152118682861, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.3113030945532955e-06, - "train/total_loss": 0.2921524941921234 + "train/classification_loss": 0.2701141834259033, + "train/contrastive_loss": 1.2464015483856201, + "train/negative_loss": 1.2143200635910034, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.032081447541713715, + "train/total_loss": 0.5193945169448853 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.1370704621076584, - "train/contrastive_loss": 0.5843364596366882, - "train/negative_loss": 0.48446545004844666, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.09987100213766098, - "train/total_loss": 0.2539377510547638 + "train/classification_loss": 0.16154073178768158, + "train/contrastive_loss": 1.0530773401260376, + "train/negative_loss": 1.0436376333236694, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.009439758025109768, + "train/total_loss": 0.37215620279312134 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.11835867911577225, - "train/contrastive_loss": 1.2734872102737427, - "train/negative_loss": 1.0902032852172852, + "train/classification_loss": 0.33457106351852417, + "train/contrastive_loss": 2.454972267150879, + "train/negative_loss": 1.4503281116485596, "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.18328392505645752, - "train/total_loss": 0.3730561137199402 + "train/num_positives": 18, + "train/positive_loss": 1.0046441555023193, + "train/total_loss": 0.8255655169487 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.18986214697360992, - "train/contrastive_loss": 1.8498696088790894, - "train/negative_loss": 1.8358070850372314, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.014062575995922089, - "train/total_loss": 0.5598360896110535 + "train/classification_loss": 0.15463872253894806, + "train/contrastive_loss": 1.6894177198410034, + "train/negative_loss": 0.9045474529266357, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.7848702669143677, + "train/total_loss": 0.49252229928970337 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.1448887139558792, - "train/contrastive_loss": 1.9474719762802124, - "train/negative_loss": 1.077724575996399, + "train/classification_loss": 0.1873106211423874, + "train/contrastive_loss": 2.148073673248291, + "train/negative_loss": 1.8950856924057007, "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.8697474002838135, - "train/total_loss": 0.5343831181526184 + "train/positive_loss": 0.2529880404472351, + "train/total_loss": 0.6169253587722778 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.15421225130558014, - "train/contrastive_loss": 0.47489413619041443, - "train/negative_loss": 0.474039226770401, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.000854899175465107, - "train/total_loss": 0.2491910755634308 + "train/classification_loss": 0.25849273800849915, + "train/contrastive_loss": 3.0028321743011475, + "train/negative_loss": 3.002824306488037, + "train/num_negatives": 48, + "train/num_positives": 2, + "train/positive_loss": 7.867844033171423e-06, + "train/total_loss": 0.85905921459198 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.20038644969463348, - "train/contrastive_loss": 2.7810306549072266, - "train/negative_loss": 1.1097065210342407, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.6713241338729858, - "train/total_loss": 0.7565926313400269 + "train/classification_loss": 0.1882040947675705, + "train/contrastive_loss": 2.9411730766296387, + "train/negative_loss": 1.4729305505752563, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 1.4682424068450928, + "train/total_loss": 0.7764387130737305 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.22542965412139893, - "train/contrastive_loss": 3.4064879417419434, - "train/negative_loss": 2.754279136657715, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.6522088050842285, - "train/total_loss": 0.9067272543907166 + "train/classification_loss": 0.12473208457231522, + "train/contrastive_loss": 0.3067686855792999, + "train/negative_loss": 0.2376350611448288, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.06913362443447113, + "train/total_loss": 0.18608582019805908 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.13997988402843475, - "train/contrastive_loss": 0.5593938231468201, - "train/negative_loss": 0.2740250825881958, + "train/classification_loss": 0.19111350178718567, + "train/contrastive_loss": 0.7253856658935547, + "train/negative_loss": 0.6835953593254089, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.28536874055862427, - "train/total_loss": 0.251858651638031 + "train/num_positives": 8, + "train/positive_loss": 0.041790325194597244, + "train/total_loss": 0.3361906409263611 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.16965703666210175, - "train/contrastive_loss": 3.18141770362854, - "train/negative_loss": 1.7196173667907715, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.4618003368377686, - "train/total_loss": 0.8059406280517578 + "train/classification_loss": 0.20824451744556427, + "train/contrastive_loss": 1.2593035697937012, + "train/negative_loss": 0.9832590818405151, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.2760445475578308, + "train/total_loss": 0.4601052403450012 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.23917052149772644, - "train/contrastive_loss": 2.800565481185913, - "train/negative_loss": 1.2786033153533936, - "train/num_negatives": 46, + "train/classification_loss": 0.29199981689453125, + "train/contrastive_loss": 3.435810089111328, + "train/negative_loss": 1.1639904975891113, + "train/num_negatives": 36, "train/num_positives": 6, - "train/positive_loss": 1.5219621658325195, - "train/total_loss": 0.7992836236953735 + "train/positive_loss": 2.271819591522217, + "train/total_loss": 0.9791618585586548 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.1987878829240799, - "train/contrastive_loss": 2.250755786895752, - "train/negative_loss": 1.6175445318222046, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.6332111358642578, - "train/total_loss": 0.6489390730857849 + "train/classification_loss": 0.14920663833618164, + "train/contrastive_loss": 1.0227805376052856, + "train/negative_loss": 0.2172389030456543, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.8055416345596313, + "train/total_loss": 0.35376274585723877 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.18078388273715973, - "train/contrastive_loss": 3.3108179569244385, - "train/negative_loss": 2.98850154876709, + "train/classification_loss": 0.1258079558610916, + "train/contrastive_loss": 1.0636166334152222, + "train/negative_loss": 0.3190959393978119, "train/num_negatives": 34, "train/num_positives": 22, - "train/positive_loss": 0.32231631875038147, - "train/total_loss": 0.8429474830627441 + "train/positive_loss": 0.7445207238197327, + "train/total_loss": 0.3385312855243683 + }, + { + "epoch": 8.80281690140845, + "step": 2500, + "train/classification_loss": 0.17183078825473785, + "train/contrastive_loss": 3.120384693145752, + "train/negative_loss": 0.8461884260177612, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 2.274196147918701, + "train/total_loss": 0.795907735824585 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.22721002995967865, - "train/contrastive_loss": 3.6816799640655518, - "train/negative_loss": 1.8761519193649292, + "train/classification_loss": 0.19278113543987274, + "train/contrastive_loss": 1.627281665802002, + "train/negative_loss": 0.9829041957855225, "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.6443774104118347, + "train/total_loss": 0.5182374715805054 + }, + { + "epoch": 8.80281690140845, + "step": 2500, + "train/classification_loss": 0.19485071301460266, + "train/contrastive_loss": 0.9677084684371948, + "train/negative_loss": 0.7169820666313171, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.2507264316082001, + "train/total_loss": 0.3883923888206482 + }, + { + "epoch": 8.80281690140845, + "step": 2500, + "train/classification_loss": 0.12035193294286728, + "train/contrastive_loss": 0.5098100304603577, + "train/negative_loss": 0.4969024658203125, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.012907564640045166, + "train/total_loss": 0.22231394052505493 + }, + { + "epoch": 8.80281690140845, + "step": 2500, + "train/classification_loss": 0.18376772105693817, + "train/contrastive_loss": 2.4269652366638184, + "train/negative_loss": 1.1219836473464966, + "train/num_negatives": 40, "train/num_positives": 10, - "train/positive_loss": 1.8055280447006226, - "train/total_loss": 0.9635460376739502 + "train/positive_loss": 1.3049817085266113, + "train/total_loss": 0.669160783290863 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.21519842743873596, - "train/contrastive_loss": 4.479783535003662, - "train/negative_loss": 3.470940113067627, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.0088434219360352, - "train/total_loss": 1.1111551523208618 + "train/classification_loss": 0.2328861504793167, + "train/contrastive_loss": 1.6766852140426636, + "train/negative_loss": 1.5928853750228882, + "train/num_negatives": 46, + "train/num_positives": 2, + "train/positive_loss": 0.0837998166680336, + "train/total_loss": 0.5682231783866882 + }, + { + "epoch": 8.80281690140845, + "step": 2500, + "train/classification_loss": 0.1382860541343689, + "train/contrastive_loss": 1.5263104438781738, + "train/negative_loss": 0.667002260684967, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.859308123588562, + "train/total_loss": 0.44354814291000366 + }, + { + "epoch": 8.80281690140845, + "step": 2500, + "train/classification_loss": 0.1886458843946457, + "train/contrastive_loss": 1.6759822368621826, + "train/negative_loss": 1.0520031452178955, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.6239790916442871, + "train/total_loss": 0.5238423347473145 + }, + { + "epoch": 8.80281690140845, + "step": 2500, + "train/classification_loss": 0.1672661006450653, + "train/contrastive_loss": 2.2461981773376465, + "train/negative_loss": 0.5392714738845825, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 1.7069268226623535, + "train/total_loss": 0.6165057420730591 + }, + { + "epoch": 8.80281690140845, + "step": 2500, + "train/classification_loss": 0.17669512331485748, + "train/contrastive_loss": 5.6372222900390625, + "train/negative_loss": 5.63722038269043, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 1.8477469438948901e-06, + "train/total_loss": 1.3041396141052246 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.2935626804828644, - "train/contrastive_loss": 4.341115951538086, - "train/negative_loss": 2.4350368976593018, + "train/classification_loss": 0.1775110512971878, + "train/contrastive_loss": 2.8417880535125732, + "train/negative_loss": 0.47931107878685, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.9060792922973633, - "train/total_loss": 1.1617858409881592 + "train/positive_loss": 2.3624770641326904, + "train/total_loss": 0.7458686828613281 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.17160949110984802, - "train/contrastive_loss": 0.9931501150131226, - "train/negative_loss": 0.98577880859375, + "train/classification_loss": 0.21907341480255127, + "train/contrastive_loss": 3.106001377105713, + "train/negative_loss": 1.3382761478424072, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.007371308282017708, - "train/total_loss": 0.3702394962310791 + "train/num_positives": 8, + "train/positive_loss": 1.7677253484725952, + "train/total_loss": 0.8402736783027649 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.15771405398845673, - "train/contrastive_loss": 1.4235615730285645, - "train/negative_loss": 0.9576037526130676, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.46595776081085205, - "train/total_loss": 0.4424263834953308 + "train/classification_loss": 0.15186597406864166, + "train/contrastive_loss": 1.9121085405349731, + "train/negative_loss": 0.9349023103713989, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.9772062301635742, + "train/total_loss": 0.534287691116333 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.13973362743854523, - "train/contrastive_loss": 1.4298356771469116, - "train/negative_loss": 0.35653555393218994, - "train/num_negatives": 46, + "train/classification_loss": 0.26104214787483215, + "train/contrastive_loss": 2.1074230670928955, + "train/negative_loss": 2.0602364540100098, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 1.0733001232147217, - "train/total_loss": 0.4257007837295532 + "train/positive_loss": 0.047186508774757385, + "train/total_loss": 0.6825267672538757 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.2254442572593689, - "train/contrastive_loss": 1.5596047639846802, - "train/negative_loss": 1.5596047639846802, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.537365198135376 - }, - { - "epoch": 9.505703422053232, - "eval_exact_match_accuracy": 0.3314285714285714, - "eval_hamming_loss": 0.06476190476190476, - "eval_loss": 0.5637803077697754, - "eval_macro_f1": 0.3284634705827146, - "eval_macro_precision": 0.5954213830320978, - "eval_macro_recall": 0.25577848005396103, - "eval_micro_f1": 0.5731166912850812, - "eval_micro_precision": 0.8168421052631579, - "eval_micro_recall": 0.44141069397042093, - "eval_runtime": 2.6208, - "eval_samples_per_second": 200.32, - "eval_steps_per_second": 25.183, + "train/classification_loss": 0.15953369438648224, + "train/contrastive_loss": 0.5105753540992737, + "train/negative_loss": 0.5024698972702026, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.008105463348329067, + "train/total_loss": 0.2616487741470337 + }, + { + "epoch": 8.80281690140845, + "eval_exact_match_accuracy": 0.2874779541446208, + "eval_hamming_loss": 0.06805685237057786, + "eval_loss": 0.5672438144683838, + "eval_macro_f1": 0.3656328044139099, + "eval_macro_precision": 0.5700484562146668, + "eval_macro_recall": 0.2988843578849931, + "eval_micro_f1": 0.5406162464985994, + "eval_micro_precision": 0.7877551020408163, + "eval_micro_recall": 0.4115138592750533, + "eval_runtime": 2.8461, + "eval_samples_per_second": 199.217, + "eval_steps_per_second": 24.946, "step": 2500 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.14659835398197174, - "train/contrastive_loss": 0.2859551012516022, - "train/negative_loss": 0.26070132851600647, - "train/num_negatives": 22, - "train/num_positives": 24, - "train/positive_loss": 0.025253772735595703, - "train/total_loss": 0.2037893831729889 + "train/classification_loss": 0.09683547914028168, + "train/contrastive_loss": 0.24993473291397095, + "train/negative_loss": 0.23617425560951233, + "train/num_negatives": 46, + "train/num_positives": 10, + "train/positive_loss": 0.01376048382371664, + "train/total_loss": 0.14682242274284363 }, { - "epoch": 9.505703422053232, + "epoch": 8.80281690140845, "step": 2500, - "train/classification_loss": 0.24197712540626526, - "train/contrastive_loss": 2.152993679046631, - "train/negative_loss": 1.174340009689331, - "train/num_negatives": 32, - "train/num_positives": 10, - "train/positive_loss": 0.9786537289619446, - "train/total_loss": 0.672575831413269 + "train/classification_loss": 0.15611132979393005, + "train/contrastive_loss": 1.1421875953674316, + "train/negative_loss": 0.8174611926078796, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.324726402759552, + "train/total_loss": 0.3845488429069519 }, { - "epoch": 9.695817490494296, - "grad_norm": 6.922210693359375, - "learning_rate": 1.96275494672755e-05, - "loss": 0.6203, + "epoch": 8.97887323943662, + "grad_norm": 10.806668281555176, + "learning_rate": 1.9655250176180408e-05, + "loss": 0.6965, "step": 2550 }, { - "epoch": 9.695817490494296, + "epoch": 8.97887323943662, "step": 2550, - "train/classification_loss": 0.17781147360801697, - "train/contrastive_loss": 0.7463839650154114, - "train/negative_loss": 0.5875096917152405, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.1588742733001709, - "train/total_loss": 0.32708826661109924 + "train/classification_loss": 0.22458066046237946, + "train/contrastive_loss": 0.7480671405792236, + "train/negative_loss": 0.40531519055366516, + "train/num_negatives": 34, + "train/num_positives": 12, + "train/positive_loss": 0.34275197982788086, + "train/total_loss": 0.37419408559799194 }, { - "epoch": 9.695817490494296, + "epoch": 8.97887323943662, "step": 2550, - "train/classification_loss": 0.11165871471166611, - "train/contrastive_loss": 0.6961846351623535, - "train/negative_loss": 0.47317594289779663, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.22300872206687927, - "train/total_loss": 0.2508956491947174 + "train/classification_loss": 0.1722177416086197, + "train/contrastive_loss": 0.6076792478561401, + "train/negative_loss": 0.574845016002655, + "train/num_negatives": 28, + "train/num_positives": 22, + "train/positive_loss": 0.03283420950174332, + "train/total_loss": 0.29375359416007996 }, { - "epoch": 9.885931558935361, - "grad_norm": 8.875618934631348, - "learning_rate": 1.9619939117199394e-05, - "loss": 0.6684, + "epoch": 9.154929577464788, + "grad_norm": 9.524175643920898, + "learning_rate": 1.964820295983087e-05, + "loss": 0.6568, "step": 2600 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.29656562209129333, - "train/contrastive_loss": 1.9065977334976196, - "train/negative_loss": 0.8473290205001831, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.0592687129974365, - "train/total_loss": 0.6778851747512817 + "train/classification_loss": 0.24628448486328125, + "train/contrastive_loss": 2.4654972553253174, + "train/negative_loss": 1.4616281986236572, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.0038690567016602, + "train/total_loss": 0.7393839359283447 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.19247716665267944, - "train/contrastive_loss": 1.8388125896453857, - "train/negative_loss": 1.335018277168274, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.5037943124771118, - "train/total_loss": 0.5602396726608276 + "train/classification_loss": 0.23898032307624817, + "train/contrastive_loss": 0.7137899994850159, + "train/negative_loss": 0.48506832122802734, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.22872166335582733, + "train/total_loss": 0.3817383050918579 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.1876644790172577, - "train/contrastive_loss": 1.0201715230941772, - "train/negative_loss": 0.2376278042793274, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.7825437188148499, - "train/total_loss": 0.39169877767562866 + "train/classification_loss": 0.24360999464988708, + "train/contrastive_loss": 2.752887487411499, + "train/negative_loss": 1.7477415800094604, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.0051459074020386, + "train/total_loss": 0.7941875457763672 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.21298527717590332, - "train/contrastive_loss": 2.4026987552642822, - "train/negative_loss": 1.6160497665405273, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.7866490483283997, - "train/total_loss": 0.6935250759124756 + "train/classification_loss": 0.14797106385231018, + "train/contrastive_loss": 2.684443950653076, + "train/negative_loss": 1.6355658769607544, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 1.0488781929016113, + "train/total_loss": 0.6848598718643188 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.11778660118579865, - "train/contrastive_loss": 0.8211440443992615, - "train/negative_loss": 0.5717882513999939, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.24935580790042877, - "train/total_loss": 0.2820154130458832 + "train/classification_loss": 0.19469140470027924, + "train/contrastive_loss": 2.277411699295044, + "train/negative_loss": 1.906540870666504, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.3708707392215729, + "train/total_loss": 0.6501737236976624 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.18624909222126007, - "train/contrastive_loss": 2.1136913299560547, - "train/negative_loss": 1.1879247426986694, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.9257665276527405, - "train/total_loss": 0.6089873909950256 + "train/classification_loss": 0.19751551747322083, + "train/contrastive_loss": 2.7453670501708984, + "train/negative_loss": 1.3876423835754395, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 1.3577245473861694, + "train/total_loss": 0.746588945388794 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.23874695599079132, - "train/contrastive_loss": 1.7688908576965332, - "train/negative_loss": 1.1315724849700928, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.6373183727264404, - "train/total_loss": 0.5925251245498657 + "train/classification_loss": 0.2012830525636673, + "train/contrastive_loss": 2.037076234817505, + "train/negative_loss": 1.1387380361557007, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.8983381986618042, + "train/total_loss": 0.608698308467865 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.15093456208705902, - "train/contrastive_loss": 2.3175013065338135, - "train/negative_loss": 2.087660312652588, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.22984106838703156, - "train/total_loss": 0.6144348382949829 + "train/classification_loss": 0.19069236516952515, + "train/contrastive_loss": 0.9895957112312317, + "train/negative_loss": 0.9894549250602722, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 0.00014079608081374317, + "train/total_loss": 0.38861149549484253 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.15519070625305176, - "train/contrastive_loss": 1.6411545276641846, - "train/negative_loss": 1.4045480489730835, + "train/classification_loss": 0.09525246173143387, + "train/contrastive_loss": 0.8819663524627686, + "train/negative_loss": 0.5683714151382446, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.23660652339458466, - "train/total_loss": 0.4834216237068176 + "train/positive_loss": 0.31359490752220154, + "train/total_loss": 0.271645724773407 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.32453209161758423, - "train/contrastive_loss": 2.722510576248169, - "train/negative_loss": 1.371407389640808, + "train/classification_loss": 0.17532993853092194, + "train/contrastive_loss": 1.8370440006256104, + "train/negative_loss": 1.2459131479263306, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.3511031866073608, - "train/total_loss": 0.8690342307090759 + "train/num_positives": 14, + "train/positive_loss": 0.5911308526992798, + "train/total_loss": 0.5427387356758118 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.17034685611724854, - "train/contrastive_loss": 1.7864702939987183, - "train/negative_loss": 1.3108986616134644, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.4755716323852539, - "train/total_loss": 0.5276409387588501 + "train/classification_loss": 0.1475764960050583, + "train/contrastive_loss": 1.6424684524536133, + "train/negative_loss": 0.6133848428726196, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 1.0290836095809937, + "train/total_loss": 0.4760701656341553 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.12166940420866013, - "train/contrastive_loss": 1.8217546939849854, - "train/negative_loss": 0.5107438564300537, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 1.3110108375549316, - "train/total_loss": 0.48602035641670227 + "train/classification_loss": 0.18745386600494385, + "train/contrastive_loss": 1.9108036756515503, + "train/negative_loss": 1.565867304801941, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.344936341047287, + "train/total_loss": 0.5696146488189697 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.19335883855819702, - "train/contrastive_loss": 3.4853243827819824, - "train/negative_loss": 2.073427677154541, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.4118967056274414, - "train/total_loss": 0.8904237151145935 + "train/classification_loss": 0.19530166685581207, + "train/contrastive_loss": 3.8807806968688965, + "train/negative_loss": 2.0134706497192383, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.8673100471496582, + "train/total_loss": 0.9714577794075012 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.11932893097400665, - "train/contrastive_loss": 2.2246897220611572, - "train/negative_loss": 2.2208569049835205, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.0038328261580318213, - "train/total_loss": 0.5642668604850769 + "train/classification_loss": 0.16424857079982758, + "train/contrastive_loss": 1.0744452476501465, + "train/negative_loss": 0.5899219512939453, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.48452332615852356, + "train/total_loss": 0.37913763523101807 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.11697562783956528, - "train/contrastive_loss": 1.1809751987457275, - "train/negative_loss": 1.0619134902954102, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.11906168609857559, - "train/total_loss": 0.3531706631183624 + "train/classification_loss": 0.14020979404449463, + "train/contrastive_loss": 2.635652780532837, + "train/negative_loss": 0.7812339663505554, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.8544187545776367, + "train/total_loss": 0.6673403382301331 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.13384760916233063, - "train/contrastive_loss": 0.8855656385421753, - "train/negative_loss": 0.5536890029907227, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.33187660574913025, - "train/total_loss": 0.3109607398509979 + "train/classification_loss": 0.1672203689813614, + "train/contrastive_loss": 1.307839274406433, + "train/negative_loss": 0.6420754194259644, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.6657638549804688, + "train/total_loss": 0.4287882447242737 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.24009336531162262, - "train/contrastive_loss": 2.6937241554260254, - "train/negative_loss": 1.4248874187469482, - "train/num_negatives": 40, + "train/classification_loss": 0.13216516375541687, + "train/contrastive_loss": 1.2569119930267334, + "train/negative_loss": 0.5905213356018066, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 1.2688367366790771, - "train/total_loss": 0.7788382172584534 + "train/positive_loss": 0.6663906574249268, + "train/total_loss": 0.3835475742816925 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.19232861697673798, - "train/contrastive_loss": 1.3851382732391357, - "train/negative_loss": 0.4147651195526123, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.9703731536865234, - "train/total_loss": 0.4693562984466553 + "train/classification_loss": 0.18154656887054443, + "train/contrastive_loss": 0.45820435881614685, + "train/negative_loss": 0.353636234998703, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.10456812381744385, + "train/total_loss": 0.27318745851516724 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.16710811853408813, - "train/contrastive_loss": 0.5948719382286072, - "train/negative_loss": 0.5937320590019226, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.0011398715432733297, - "train/total_loss": 0.28608250617980957 + "train/classification_loss": 0.15409497916698456, + "train/contrastive_loss": 1.564359188079834, + "train/negative_loss": 0.5728989839553833, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.9914602637290955, + "train/total_loss": 0.46696680784225464 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.16234229505062103, - "train/contrastive_loss": 2.4573988914489746, - "train/negative_loss": 1.6317636966705322, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.8256351947784424, - "train/total_loss": 0.6538220643997192 + "train/classification_loss": 0.21266396343708038, + "train/contrastive_loss": 2.9230458736419678, + "train/negative_loss": 1.4068803787231445, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.5161654949188232, + "train/total_loss": 0.7972731590270996 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.22423763573169708, - "train/contrastive_loss": 1.668856143951416, - "train/negative_loss": 0.3533918261528015, - "train/num_negatives": 44, + "train/classification_loss": 0.13373976945877075, + "train/contrastive_loss": 1.6649099588394165, + "train/negative_loss": 1.5701851844787598, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.3154643774032593, - "train/total_loss": 0.5580088496208191 + "train/positive_loss": 0.09472475200891495, + "train/total_loss": 0.466721773147583 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.2446756362915039, - "train/contrastive_loss": 1.845736026763916, - "train/negative_loss": 1.349969506263733, - "train/num_negatives": 44, + "train/classification_loss": 0.13529695570468903, + "train/contrastive_loss": 3.0700488090515137, + "train/negative_loss": 1.8356618881225586, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.49576646089553833, - "train/total_loss": 0.6138228178024292 + "train/positive_loss": 1.234386920928955, + "train/total_loss": 0.7493067383766174 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.1560017317533493, - "train/contrastive_loss": 2.0918211936950684, - "train/negative_loss": 0.5444230437278748, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 1.5473980903625488, - "train/total_loss": 0.5743659734725952 + "train/classification_loss": 0.15869060158729553, + "train/contrastive_loss": 2.246107339859009, + "train/negative_loss": 0.882771372795105, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 1.3633359670639038, + "train/total_loss": 0.6079120635986328 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.13829383254051208, - "train/contrastive_loss": 0.39930641651153564, - "train/negative_loss": 0.32361871004104614, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.0756876990199089, - "train/total_loss": 0.2181551158428192 + "train/classification_loss": 0.25418511033058167, + "train/contrastive_loss": 3.2660160064697266, + "train/negative_loss": 1.8137931823730469, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.4522228240966797, + "train/total_loss": 0.9073883295059204 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.10825981944799423, - "train/contrastive_loss": 1.0709753036499023, - "train/negative_loss": 0.8598436117172241, + "train/classification_loss": 0.18978899717330933, + "train/contrastive_loss": 2.1697194576263428, + "train/negative_loss": 0.8105581998825073, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.21113170683383942, - "train/total_loss": 0.32245486974716187 + "train/num_positives": 10, + "train/positive_loss": 1.3591612577438354, + "train/total_loss": 0.6237329244613647 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.2805103063583374, - "train/contrastive_loss": 1.8746013641357422, - "train/negative_loss": 0.5929605960845947, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.2816407680511475, - "train/total_loss": 0.6554305553436279 + "train/classification_loss": 0.20158325135707855, + "train/contrastive_loss": 1.7320866584777832, + "train/negative_loss": 1.474867820739746, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.2572188675403595, + "train/total_loss": 0.5480005741119385 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.26198163628578186, - "train/contrastive_loss": 3.387484550476074, - "train/negative_loss": 1.782851219177246, + "train/classification_loss": 0.19087320566177368, + "train/contrastive_loss": 1.4457511901855469, + "train/negative_loss": 1.4266146421432495, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.6046333312988281, - "train/total_loss": 0.9394785165786743 + "train/num_positives": 4, + "train/positive_loss": 0.019136596471071243, + "train/total_loss": 0.48002344369888306 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.1664089858531952, - "train/contrastive_loss": 2.608822822570801, - "train/negative_loss": 1.9956750869750977, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.6131478548049927, - "train/total_loss": 0.6881735324859619 + "train/classification_loss": 0.1796512007713318, + "train/contrastive_loss": 0.326382040977478, + "train/negative_loss": 0.26966819167137146, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.05671383813023567, + "train/total_loss": 0.24492761492729187 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.19842618703842163, - "train/contrastive_loss": 0.8147100210189819, - "train/negative_loss": 0.5882883071899414, - "train/num_negatives": 40, + "train/classification_loss": 0.24396435916423798, + "train/contrastive_loss": 2.816596508026123, + "train/negative_loss": 1.7620964050292969, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.22642169892787933, - "train/total_loss": 0.36136817932128906 - }, - { - "epoch": 9.885931558935361, - "step": 2600, - "train/classification_loss": 0.21570129692554474, - "train/contrastive_loss": 1.0830073356628418, - "train/negative_loss": 0.8541463613510132, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.2288610190153122, - "train/total_loss": 0.4323027729988098 - }, - { - "epoch": 9.885931558935361, - "step": 2600, - "train/classification_loss": 0.14770914614200592, - "train/contrastive_loss": 1.969111442565918, - "train/negative_loss": 0.9602376818656921, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 1.0088738203048706, - "train/total_loss": 0.5415314435958862 + "train/positive_loss": 1.0545001029968262, + "train/total_loss": 0.8072836995124817 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.22830671072006226, - "train/contrastive_loss": 2.0414857864379883, - "train/negative_loss": 1.2080694437026978, + "train/classification_loss": 0.17636483907699585, + "train/contrastive_loss": 0.4791860580444336, + "train/negative_loss": 0.4780164659023285, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.8334162831306458, - "train/total_loss": 0.636603832244873 + "train/num_positives": 10, + "train/positive_loss": 0.0011696013389155269, + "train/total_loss": 0.2722020447254181 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.2509337067604065, - "train/contrastive_loss": 1.083841323852539, - "train/negative_loss": 1.0832983255386353, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0005429668817669153, - "train/total_loss": 0.4677019715309143 + "train/classification_loss": 0.18084284663200378, + "train/contrastive_loss": 1.3591601848602295, + "train/negative_loss": 1.2169331312179565, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.14222702383995056, + "train/total_loss": 0.45267489552497864 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.20231537520885468, - "train/contrastive_loss": 1.369246244430542, - "train/negative_loss": 1.0609307289123535, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.3083155155181885, - "train/total_loss": 0.47616463899612427 + "train/classification_loss": 0.1617814600467682, + "train/contrastive_loss": 3.6317224502563477, + "train/negative_loss": 2.2193636894226074, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.4123586416244507, + "train/total_loss": 0.888126015663147 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.17808197438716888, - "train/contrastive_loss": 2.669933319091797, - "train/negative_loss": 1.9654133319854736, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.704520046710968, - "train/total_loss": 0.7120686769485474 + "train/classification_loss": 0.1851709932088852, + "train/contrastive_loss": 1.976389765739441, + "train/negative_loss": 1.21761953830719, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.758770227432251, + "train/total_loss": 0.5804489254951477 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.17015060782432556, - "train/contrastive_loss": 3.530930519104004, - "train/negative_loss": 1.1431547403335571, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 2.3877758979797363, - "train/total_loss": 0.8763366937637329 + "train/classification_loss": 0.20561179518699646, + "train/contrastive_loss": 2.7897727489471436, + "train/negative_loss": 1.7173573970794678, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 1.0724153518676758, + "train/total_loss": 0.7635663747787476 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.14904072880744934, - "train/contrastive_loss": 1.0763500928878784, - "train/negative_loss": 0.7674264907836914, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.308923602104187, - "train/total_loss": 0.36431074142456055 + "train/classification_loss": 0.22046226263046265, + "train/contrastive_loss": 1.4839712381362915, + "train/negative_loss": 0.8525365591049194, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.6314346790313721, + "train/total_loss": 0.517256498336792 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.17352311313152313, - "train/contrastive_loss": 0.9794837236404419, - "train/negative_loss": 0.9586575031280518, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.02082623727619648, - "train/total_loss": 0.3694198727607727 + "train/classification_loss": 0.1314994841814041, + "train/contrastive_loss": 1.818369746208191, + "train/negative_loss": 1.8179841041564941, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.0003856798866763711, + "train/total_loss": 0.49517345428466797 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.19916851818561554, - "train/contrastive_loss": 1.339439868927002, - "train/negative_loss": 1.3340437412261963, + "train/classification_loss": 0.18952886760234833, + "train/contrastive_loss": 1.2846763134002686, + "train/negative_loss": 0.6666244268417358, "train/num_negatives": 46, "train/num_positives": 8, - "train/positive_loss": 0.005396074615418911, - "train/total_loss": 0.4670565128326416 + "train/positive_loss": 0.6180518865585327, + "train/total_loss": 0.4464641213417053 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.1701011061668396, - "train/contrastive_loss": 1.6125702857971191, - "train/negative_loss": 1.6103378534317017, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.0022324188612401485, - "train/total_loss": 0.4926151633262634 + "train/classification_loss": 0.2132207304239273, + "train/contrastive_loss": 2.0742974281311035, + "train/negative_loss": 1.8339942693710327, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.24030321836471558, + "train/total_loss": 0.6280802488327026 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.1682114601135254, - "train/contrastive_loss": 0.8572881817817688, - "train/negative_loss": 0.7249778509140015, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.13231033086776733, - "train/total_loss": 0.3396691083908081 + "train/classification_loss": 0.1913914680480957, + "train/contrastive_loss": 1.423677682876587, + "train/negative_loss": 0.5711107850074768, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.8525668382644653, + "train/total_loss": 0.4761269986629486 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.20694273710250854, - "train/contrastive_loss": 2.0961098670959473, - "train/negative_loss": 1.4073526859283447, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.6887571215629578, - "train/total_loss": 0.6261646747589111 + "train/classification_loss": 0.23982155323028564, + "train/contrastive_loss": 3.3509202003479004, + "train/negative_loss": 2.2825989723205566, + "train/num_negatives": 42, + "train/num_positives": 8, + "train/positive_loss": 1.0683211088180542, + "train/total_loss": 0.9100056290626526 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.22106494009494781, - "train/contrastive_loss": 0.8940525054931641, - "train/negative_loss": 0.46205052733421326, + "train/classification_loss": 0.14049109816551208, + "train/contrastive_loss": 1.6200203895568848, + "train/negative_loss": 0.668586254119873, + "train/num_negatives": 46, + "train/num_positives": 10, + "train/positive_loss": 0.9514341354370117, + "train/total_loss": 0.4644951820373535 + }, + { + "epoch": 9.154929577464788, + "step": 2600, + "train/classification_loss": 0.20000284910202026, + "train/contrastive_loss": 2.8137998580932617, + "train/negative_loss": 1.6145503520965576, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.4320020079612732, - "train/total_loss": 0.3998754620552063 + "train/num_positives": 14, + "train/positive_loss": 1.1992496252059937, + "train/total_loss": 0.7627628445625305 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.15100041031837463, - "train/contrastive_loss": 3.8082435131073, - "train/negative_loss": 1.6097900867462158, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 2.198453426361084, - "train/total_loss": 0.9126491546630859 + "train/classification_loss": 0.1838768720626831, + "train/contrastive_loss": 0.7084023356437683, + "train/negative_loss": 0.7078876495361328, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.0005146655021235347, + "train/total_loss": 0.3255573511123657 + }, + { + "epoch": 9.154929577464788, + "step": 2600, + "train/classification_loss": 0.23325423896312714, + "train/contrastive_loss": 1.3782320022583008, + "train/negative_loss": 1.2698296308517456, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.10840240120887756, + "train/total_loss": 0.5089006423950195 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.15291233360767365, - "train/contrastive_loss": 1.0744211673736572, - "train/negative_loss": 0.6107544898986816, + "train/classification_loss": 0.1684018224477768, + "train/contrastive_loss": 1.2575197219848633, + "train/negative_loss": 0.8483104705810547, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.463666707277298, - "train/total_loss": 0.36779657006263733 + "train/num_positives": 12, + "train/positive_loss": 0.4092091917991638, + "train/total_loss": 0.41990578174591064 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.2813280522823334, - "train/contrastive_loss": 1.7543962001800537, - "train/negative_loss": 1.0565946102142334, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.6978015303611755, - "train/total_loss": 0.6322072744369507 + "train/classification_loss": 0.32005971670150757, + "train/contrastive_loss": 2.315727710723877, + "train/negative_loss": 1.217613935470581, + "train/num_negatives": 30, + "train/num_positives": 18, + "train/positive_loss": 1.0981138944625854, + "train/total_loss": 0.7832052707672119 + }, + { + "epoch": 9.154929577464788, + "step": 2600, + "train/classification_loss": 0.1508641541004181, + "train/contrastive_loss": 1.903778076171875, + "train/negative_loss": 1.145056128501892, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.7587219476699829, + "train/total_loss": 0.5316197872161865 + }, + { + "epoch": 9.154929577464788, + "step": 2600, + "train/classification_loss": 0.1702166199684143, + "train/contrastive_loss": 2.458134174346924, + "train/negative_loss": 2.1708731651306152, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.2872610092163086, + "train/total_loss": 0.6618434190750122 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.10040995478630066, - "train/contrastive_loss": 0.2804360091686249, - "train/negative_loss": 0.28043198585510254, + "train/classification_loss": 0.2776569724082947, + "train/contrastive_loss": 2.454988956451416, + "train/negative_loss": 2.454987049102783, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 4.023323526780587e-06, - "train/total_loss": 0.15649715065956116 + "train/num_positives": 2, + "train/positive_loss": 1.9073504518019035e-06, + "train/total_loss": 0.7686547636985779 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.15895678102970123, - "train/contrastive_loss": 1.4584732055664062, - "train/negative_loss": 0.9318289756774902, - "train/num_negatives": 38, + "train/classification_loss": 0.19200481474399567, + "train/contrastive_loss": 3.16558837890625, + "train/negative_loss": 1.7555313110351562, + "train/num_negatives": 40, "train/num_positives": 16, - "train/positive_loss": 0.526644229888916, - "train/total_loss": 0.4506514072418213 + "train/positive_loss": 1.4100570678710938, + "train/total_loss": 0.8251224756240845 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.12303021550178528, - "train/contrastive_loss": 1.5629931688308716, - "train/negative_loss": 1.0089807510375977, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.5540124177932739, - "train/total_loss": 0.43562886118888855 + "train/classification_loss": 0.17200742661952972, + "train/contrastive_loss": 0.1734849363565445, + "train/negative_loss": 0.11128728836774826, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.062197647988796234, + "train/total_loss": 0.20670440793037415 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.1919255554676056, - "train/contrastive_loss": 2.0042240619659424, - "train/negative_loss": 1.159101963043213, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.8451220393180847, - "train/total_loss": 0.5927703380584717 + "train/classification_loss": 0.18401043117046356, + "train/contrastive_loss": 0.8526637554168701, + "train/negative_loss": 0.8036697506904602, + "train/num_negatives": 40, + "train/num_positives": 8, + "train/positive_loss": 0.0489940345287323, + "train/total_loss": 0.35454317927360535 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.14806833863258362, - "train/contrastive_loss": 1.8277735710144043, - "train/negative_loss": 0.6899438500404358, - "train/num_negatives": 42, + "train/classification_loss": 0.20552721619606018, + "train/contrastive_loss": 1.5434834957122803, + "train/negative_loss": 1.0935592651367188, + "train/num_negatives": 38, "train/num_positives": 14, - "train/positive_loss": 1.1378296613693237, - "train/total_loss": 0.513623058795929 + "train/positive_loss": 0.4499242901802063, + "train/total_loss": 0.5142239332199097 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.16825230419635773, - "train/contrastive_loss": 0.6596271991729736, - "train/negative_loss": 0.6044023633003235, - "train/num_negatives": 50, + "train/classification_loss": 0.29712027311325073, + "train/contrastive_loss": 2.836956262588501, + "train/negative_loss": 1.22115159034729, + "train/num_negatives": 36, "train/num_positives": 6, - "train/positive_loss": 0.055224861949682236, - "train/total_loss": 0.30017775297164917 + "train/positive_loss": 1.615804672241211, + "train/total_loss": 0.8645115494728088 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.22660040855407715, - "train/contrastive_loss": 2.871744155883789, - "train/negative_loss": 1.4056675434112549, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.4660764932632446, - "train/total_loss": 0.8009492754936218 + "train/classification_loss": 0.15018239617347717, + "train/contrastive_loss": 0.6867485046386719, + "train/negative_loss": 0.39466720819473267, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.2920812666416168, + "train/total_loss": 0.28753209114074707 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.23490847647190094, - "train/contrastive_loss": 3.0515265464782715, - "train/negative_loss": 2.641211986541748, + "train/classification_loss": 0.13760094344615936, + "train/contrastive_loss": 1.0253562927246094, + "train/negative_loss": 0.35280925035476685, "train/num_negatives": 34, "train/num_positives": 22, - "train/positive_loss": 0.4103146195411682, - "train/total_loss": 0.845213770866394 + "train/positive_loss": 0.6725470423698425, + "train/total_loss": 0.342672199010849 + }, + { + "epoch": 9.154929577464788, + "step": 2600, + "train/classification_loss": 0.15657001733779907, + "train/contrastive_loss": 1.6581045389175415, + "train/negative_loss": 0.7265006899833679, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.9316038489341736, + "train/total_loss": 0.4881909191608429 + }, + { + "epoch": 9.154929577464788, + "step": 2600, + "train/classification_loss": 0.18820948898792267, + "train/contrastive_loss": 1.6809914112091064, + "train/negative_loss": 1.2318156957626343, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.44917571544647217, + "train/total_loss": 0.5244078040122986 + }, + { + "epoch": 9.154929577464788, + "step": 2600, + "train/classification_loss": 0.19504046440124512, + "train/contrastive_loss": 1.5233054161071777, + "train/negative_loss": 0.8468884825706482, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.6764168739318848, + "train/total_loss": 0.4997015595436096 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.20183400809764862, - "train/contrastive_loss": 1.4434902667999268, - "train/negative_loss": 0.5546771287918091, + "train/classification_loss": 0.11603426188230515, + "train/contrastive_loss": 0.686326265335083, + "train/negative_loss": 0.6851330995559692, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.8888131976127625, - "train/total_loss": 0.4905320405960083 + "train/num_positives": 16, + "train/positive_loss": 0.0011931576300412416, + "train/total_loss": 0.2532995045185089 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.15030109882354736, - "train/contrastive_loss": 2.5441555976867676, - "train/negative_loss": 1.5772167444229126, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.9669389724731445, - "train/total_loss": 0.6591322422027588 + "train/classification_loss": 0.17929503321647644, + "train/contrastive_loss": 2.505115509033203, + "train/negative_loss": 1.4139941930770874, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 1.0911211967468262, + "train/total_loss": 0.6803181171417236 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.25634264945983887, - "train/contrastive_loss": 2.937042713165283, - "train/negative_loss": 1.5873264074325562, + "train/classification_loss": 0.2623046338558197, + "train/contrastive_loss": 2.517824172973633, + "train/negative_loss": 1.8878295421600342, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.3497161865234375, - "train/total_loss": 0.8437511920928955 + "train/num_positives": 2, + "train/positive_loss": 0.6299946904182434, + "train/total_loss": 0.7658694982528687 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.20815333724021912, - "train/contrastive_loss": 3.415391206741333, - "train/negative_loss": 1.7082078456878662, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.7071833610534668, - "train/total_loss": 0.8912315368652344 + "train/classification_loss": 0.14070263504981995, + "train/contrastive_loss": 2.1426305770874023, + "train/negative_loss": 1.158164381980896, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.9844663143157959, + "train/total_loss": 0.5692287683486938 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.18672418594360352, - "train/contrastive_loss": 2.8869733810424805, - "train/negative_loss": 2.400569200515747, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.4864041209220886, - "train/total_loss": 0.7641188502311707 + "train/classification_loss": 0.20783792436122894, + "train/contrastive_loss": 1.9898386001586914, + "train/negative_loss": 1.4247000217437744, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.565138578414917, + "train/total_loss": 0.6058056354522705 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.22713646292686462, - "train/contrastive_loss": 3.5589652061462402, - "train/negative_loss": 1.7264082431793213, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.8325570821762085, - "train/total_loss": 0.938929557800293 + "train/classification_loss": 0.17116650938987732, + "train/contrastive_loss": 2.381537914276123, + "train/negative_loss": 0.7003723382949829, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 1.6811656951904297, + "train/total_loss": 0.6474741101264954 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.24679554998874664, - "train/contrastive_loss": 3.4774606227874756, - "train/negative_loss": 2.4013895988464355, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.07607102394104, - "train/total_loss": 0.9422876834869385 + "train/classification_loss": 0.1755324751138687, + "train/contrastive_loss": 4.940838813781738, + "train/negative_loss": 4.9408369064331055, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 1.7762209836291731e-06, + "train/total_loss": 1.1637002229690552 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.2595456838607788, - "train/contrastive_loss": 3.622649669647217, - "train/negative_loss": 1.5947680473327637, + "train/classification_loss": 0.1799212545156479, + "train/contrastive_loss": 2.2084808349609375, + "train/negative_loss": 0.6446971297264099, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 2.027881622314453, - "train/total_loss": 0.9840756058692932 + "train/positive_loss": 1.5637837648391724, + "train/total_loss": 0.6216174364089966 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.16012418270111084, - "train/contrastive_loss": 0.8733224868774414, - "train/negative_loss": 0.8646421432495117, + "train/classification_loss": 0.212065190076828, + "train/contrastive_loss": 2.409909725189209, + "train/negative_loss": 1.4343678951263428, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.008680322207510471, - "train/total_loss": 0.3347886800765991 + "train/num_positives": 8, + "train/positive_loss": 0.9755419492721558, + "train/total_loss": 0.6940471529960632 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.16104799509048462, - "train/contrastive_loss": 1.2155524492263794, - "train/negative_loss": 0.5472664833068848, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.6682859659194946, - "train/total_loss": 0.40415847301483154 + "train/classification_loss": 0.16545768082141876, + "train/contrastive_loss": 2.4944605827331543, + "train/negative_loss": 1.2136564254760742, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.28080415725708, + "train/total_loss": 0.6643497943878174 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.14784587919712067, - "train/contrastive_loss": 1.2956688404083252, - "train/negative_loss": 0.46407774090766907, - "train/num_negatives": 46, + "train/classification_loss": 0.25046831369400024, + "train/contrastive_loss": 2.2382519245147705, + "train/negative_loss": 2.17216157913208, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.8315911293029785, - "train/total_loss": 0.40697968006134033 + "train/positive_loss": 0.06609038263559341, + "train/total_loss": 0.6981186866760254 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.21698352694511414, - "train/contrastive_loss": 1.7252111434936523, - "train/negative_loss": 1.7252111434936523, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.562025785446167 - }, - { - "epoch": 9.885931558935361, - "eval_exact_match_accuracy": 0.2704761904761905, - "eval_hamming_loss": 0.06767507002801121, - "eval_loss": 0.5675710439682007, - "eval_macro_f1": 0.3026870648136204, - "eval_macro_precision": 0.6379566563467493, - "eval_macro_recall": 0.22018509506446052, - "eval_micro_f1": 0.5175718849840255, - "eval_micro_precision": 0.868632707774799, - "eval_micro_recall": 0.36860068259385664, - "eval_runtime": 2.6374, - "eval_samples_per_second": 199.061, - "eval_steps_per_second": 25.025, + "train/classification_loss": 0.17515461146831512, + "train/contrastive_loss": 2.257793426513672, + "train/negative_loss": 1.4612540006637573, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.7965394854545593, + "train/total_loss": 0.6267132759094238 + }, + { + "epoch": 9.154929577464788, + "eval_exact_match_accuracy": 0.2857142857142857, + "eval_hamming_loss": 0.06774561676522461, + "eval_loss": 0.5803765058517456, + "eval_macro_f1": 0.36105497113614543, + "eval_macro_precision": 0.5920739147438296, + "eval_macro_recall": 0.2825809175403302, + "eval_micro_f1": 0.5291997116077866, + "eval_micro_precision": 0.8173719376391982, + "eval_micro_recall": 0.39125799573560766, + "eval_runtime": 2.8565, + "eval_samples_per_second": 198.492, + "eval_steps_per_second": 24.855, "step": 2600 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.11975089460611343, - "train/contrastive_loss": 0.641180157661438, - "train/negative_loss": 0.5848935842514038, - "train/num_negatives": 46, + "train/classification_loss": 0.16526037454605103, + "train/contrastive_loss": 0.768109917640686, + "train/negative_loss": 0.6881194710731506, + "train/num_negatives": 44, "train/num_positives": 10, - "train/positive_loss": 0.05628659948706627, - "train/total_loss": 0.24798694252967834 + "train/positive_loss": 0.0799904614686966, + "train/total_loss": 0.3188823461532593 }, { - "epoch": 9.885931558935361, + "epoch": 9.154929577464788, "step": 2600, - "train/classification_loss": 0.17796041071414948, - "train/contrastive_loss": 0.9369737505912781, - "train/negative_loss": 0.8799952268600464, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.056978531181812286, - "train/total_loss": 0.36535516381263733 + "train/classification_loss": 0.14416836202144623, + "train/contrastive_loss": 1.0418167114257812, + "train/negative_loss": 0.7043741941452026, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.33744245767593384, + "train/total_loss": 0.35253170132637024 }, { - "epoch": 10.076045627376425, - "grad_norm": 4.023022174835205, - "learning_rate": 1.9612328767123288e-05, - "loss": 0.5893, + "epoch": 9.330985915492958, + "grad_norm": 9.925588607788086, + "learning_rate": 1.9641155743481327e-05, + "loss": 0.6413, "step": 2650 }, { - "epoch": 10.076045627376425, + "epoch": 9.330985915492958, "step": 2650, - "train/classification_loss": 0.12035703659057617, - "train/contrastive_loss": 0.44901368021965027, - "train/negative_loss": 0.37115854024887085, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.07785513997077942, - "train/total_loss": 0.2101597785949707 + "train/classification_loss": 0.1666610985994339, + "train/contrastive_loss": 0.6737055778503418, + "train/negative_loss": 0.40825411677360535, + "train/num_negatives": 38, + "train/num_positives": 18, + "train/positive_loss": 0.26545149087905884, + "train/total_loss": 0.30140221118927 }, { - "epoch": 10.076045627376425, + "epoch": 9.330985915492958, "step": 2650, - "train/classification_loss": 0.10297891497612, - "train/contrastive_loss": 0.5361615419387817, - "train/negative_loss": 0.3845428228378296, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.15161868929862976, - "train/total_loss": 0.21021121740341187 + "train/classification_loss": 0.12780001759529114, + "train/contrastive_loss": 0.5189247727394104, + "train/negative_loss": 0.5179834365844727, + "train/num_negatives": 36, + "train/num_positives": 20, + "train/positive_loss": 0.0009413353982381523, + "train/total_loss": 0.23158496618270874 }, { - "epoch": 10.26615969581749, - "grad_norm": 6.073227882385254, - "learning_rate": 1.9604718417047186e-05, - "loss": 0.604, + "epoch": 9.507042253521126, + "grad_norm": 8.174408912658691, + "learning_rate": 1.9634108527131786e-05, + "loss": 0.683, "step": 2700 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.2949216961860657, - "train/contrastive_loss": 2.702465534210205, - "train/negative_loss": 1.8540551662445068, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.8484102487564087, - "train/total_loss": 0.8354148268699646 + "train/classification_loss": 0.24618496000766754, + "train/contrastive_loss": 2.3181824684143066, + "train/negative_loss": 1.2733820676803589, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.0448005199432373, + "train/total_loss": 0.7098214626312256 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.21968935430049896, - "train/contrastive_loss": 2.8710248470306396, - "train/negative_loss": 1.5602225065231323, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 1.3108023405075073, - "train/total_loss": 0.793894350528717 + "train/classification_loss": 0.24503618478775024, + "train/contrastive_loss": 0.7689821720123291, + "train/negative_loss": 0.7245208024978638, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.04446136951446533, + "train/total_loss": 0.39883261919021606 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.16940319538116455, - "train/contrastive_loss": 1.3214343786239624, - "train/negative_loss": 0.48005831241607666, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.8413760662078857, - "train/total_loss": 0.43369007110595703 + "train/classification_loss": 0.23767878115177155, + "train/contrastive_loss": 2.9527482986450195, + "train/negative_loss": 1.5046037435531616, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.4481446743011475, + "train/total_loss": 0.8282284140586853 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.22618834674358368, - "train/contrastive_loss": 3.14735746383667, - "train/negative_loss": 1.6831586360931396, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.4641987085342407, - "train/total_loss": 0.8556598424911499 + "train/classification_loss": 0.1498671919107437, + "train/contrastive_loss": 1.6355702877044678, + "train/negative_loss": 1.4459677934646606, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.18960247933864594, + "train/total_loss": 0.4769812822341919 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.13228942453861237, - "train/contrastive_loss": 1.9890316724777222, - "train/negative_loss": 1.185418725013733, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.8036129474639893, - "train/total_loss": 0.5300957560539246 + "train/classification_loss": 0.19280041754245758, + "train/contrastive_loss": 2.824444055557251, + "train/negative_loss": 2.696667432785034, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.1277766227722168, + "train/total_loss": 0.7576892375946045 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.18633848428726196, - "train/contrastive_loss": 2.623748302459717, - "train/negative_loss": 1.2860187292099, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 1.3377296924591064, - "train/total_loss": 0.7110881805419922 + "train/classification_loss": 0.2015714794397354, + "train/contrastive_loss": 2.269200325012207, + "train/negative_loss": 1.5796488523483276, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.6895513534545898, + "train/total_loss": 0.6554115414619446 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.2492387443780899, - "train/contrastive_loss": 2.846243143081665, - "train/negative_loss": 2.045464277267456, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.8007789254188538, - "train/total_loss": 0.8184873461723328 + "train/classification_loss": 0.1885913759469986, + "train/contrastive_loss": 1.3630460500717163, + "train/negative_loss": 0.7901840209960938, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.5728620290756226, + "train/total_loss": 0.4612005949020386 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.17351770401000977, - "train/contrastive_loss": 2.7344155311584473, - "train/negative_loss": 1.9138165712356567, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.820598840713501, - "train/total_loss": 0.7204008102416992 + "train/classification_loss": 0.18265803158283234, + "train/contrastive_loss": 1.1519484519958496, + "train/negative_loss": 1.1519181728363037, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 3.027961793122813e-05, + "train/total_loss": 0.413047730922699 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.15251557528972626, - "train/contrastive_loss": 2.167224407196045, - "train/negative_loss": 1.5709794759750366, + "train/classification_loss": 0.11412450671195984, + "train/contrastive_loss": 0.6452596783638, + "train/negative_loss": 0.45017990469932556, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.5962450504302979, - "train/total_loss": 0.5859604477882385 + "train/positive_loss": 0.19507978856563568, + "train/total_loss": 0.2431764453649521 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.30629029870033264, - "train/contrastive_loss": 3.0127954483032227, - "train/negative_loss": 1.5318022966384888, + "train/classification_loss": 0.20929855108261108, + "train/contrastive_loss": 2.9067678451538086, + "train/negative_loss": 2.310359239578247, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.4809932708740234, - "train/total_loss": 0.9088493585586548 + "train/num_positives": 14, + "train/positive_loss": 0.5964085459709167, + "train/total_loss": 0.7906521558761597 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.18003572523593903, - "train/contrastive_loss": 2.4549362659454346, - "train/negative_loss": 1.6087826490402222, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.8461536169052124, - "train/total_loss": 0.6710230112075806 + "train/classification_loss": 0.13452234864234924, + "train/contrastive_loss": 0.902179479598999, + "train/negative_loss": 0.753136396408081, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.14904308319091797, + "train/total_loss": 0.31495824456214905 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.1261659860610962, - "train/contrastive_loss": 1.8689945936203003, - "train/negative_loss": 0.47651562094688416, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 1.3924789428710938, - "train/total_loss": 0.4999649226665497 + "train/classification_loss": 0.17940469086170197, + "train/contrastive_loss": 3.0230913162231445, + "train/negative_loss": 1.974744200706482, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 1.0483472347259521, + "train/total_loss": 0.7840229272842407 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.20567089319229126, - "train/contrastive_loss": 4.514654636383057, - "train/negative_loss": 2.3004069328308105, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 2.214247703552246, - "train/total_loss": 1.1086018085479736 + "train/classification_loss": 0.21684207022190094, + "train/contrastive_loss": 4.046243667602539, + "train/negative_loss": 2.533534288406372, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.512709617614746, + "train/total_loss": 1.0260908603668213 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.10112864524126053, - "train/contrastive_loss": 1.5802361965179443, - "train/negative_loss": 1.5801550149917603, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 8.119695849018171e-05, - "train/total_loss": 0.41717588901519775 + "train/classification_loss": 0.15810632705688477, + "train/contrastive_loss": 1.295092225074768, + "train/negative_loss": 0.8452231287956238, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.4498691260814667, + "train/total_loss": 0.41712477803230286 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.12529538571834564, - "train/contrastive_loss": 1.7084649801254272, - "train/negative_loss": 0.6553754806518555, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.0530894994735718, - "train/total_loss": 0.46698838472366333 + "train/classification_loss": 0.13270686566829681, + "train/contrastive_loss": 2.3346595764160156, + "train/negative_loss": 0.6693814396858215, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.6652781963348389, + "train/total_loss": 0.5996387600898743 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.1447140872478485, - "train/contrastive_loss": 1.1550447940826416, - "train/negative_loss": 0.35852134227752686, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.7965235114097595, - "train/total_loss": 0.37572306394577026 + "train/classification_loss": 0.15910740196704865, + "train/contrastive_loss": 0.9473980665206909, + "train/negative_loss": 0.5109848976135254, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.4364131689071655, + "train/total_loss": 0.3485870361328125 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.2438010275363922, - "train/contrastive_loss": 2.9337031841278076, - "train/negative_loss": 1.777907371520996, - "train/num_negatives": 40, + "train/classification_loss": 0.10971515625715256, + "train/contrastive_loss": 1.065409541130066, + "train/negative_loss": 0.6277315616607666, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 1.1557958126068115, - "train/total_loss": 0.830541729927063 + "train/positive_loss": 0.4376779794692993, + "train/total_loss": 0.3227970600128174 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.16402509808540344, - "train/contrastive_loss": 1.8250175714492798, - "train/negative_loss": 0.7464612722396851, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 1.0785562992095947, - "train/total_loss": 0.5290286540985107 + "train/classification_loss": 0.22380180656909943, + "train/contrastive_loss": 2.012408494949341, + "train/negative_loss": 0.6866670250892639, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 1.3257414102554321, + "train/total_loss": 0.6262835264205933 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.15492069721221924, - "train/contrastive_loss": 1.0303562879562378, - "train/negative_loss": 1.0288066864013672, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.001549598528072238, - "train/total_loss": 0.3609919548034668 + "train/classification_loss": 0.14739564061164856, + "train/contrastive_loss": 0.718749463558197, + "train/negative_loss": 0.6504449248313904, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.06830452382564545, + "train/total_loss": 0.29114553332328796 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.15241339802742004, - "train/contrastive_loss": 1.3987855911254883, - "train/negative_loss": 1.1106903553009033, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.2880952060222626, - "train/total_loss": 0.4321705102920532 + "train/classification_loss": 0.20180334150791168, + "train/contrastive_loss": 3.0506796836853027, + "train/negative_loss": 1.5672178268432617, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.4834619760513306, + "train/total_loss": 0.8119392991065979 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.21975363790988922, - "train/contrastive_loss": 1.8838533163070679, - "train/negative_loss": 0.3946819007396698, - "train/num_negatives": 44, + "train/classification_loss": 0.13206076622009277, + "train/contrastive_loss": 2.2139627933502197, + "train/negative_loss": 2.194715738296509, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.4891713857650757, - "train/total_loss": 0.5965242981910706 + "train/positive_loss": 0.019246986135840416, + "train/total_loss": 0.5748533010482788 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.2536977529525757, - "train/contrastive_loss": 2.919379234313965, - "train/negative_loss": 1.4839332103729248, - "train/num_negatives": 44, + "train/classification_loss": 0.13065706193447113, + "train/contrastive_loss": 2.7108256816864014, + "train/negative_loss": 2.2679407596588135, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 1.43544602394104, - "train/total_loss": 0.8375735878944397 + "train/positive_loss": 0.4428848624229431, + "train/total_loss": 0.6728222370147705 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.16020727157592773, - "train/contrastive_loss": 2.6388282775878906, - "train/negative_loss": 0.8714284896850586, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 1.767399787902832, - "train/total_loss": 0.6879729628562927 + "train/classification_loss": 0.16608917713165283, + "train/contrastive_loss": 2.4329495429992676, + "train/negative_loss": 1.4563369750976562, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.9766125679016113, + "train/total_loss": 0.6526790857315063 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.14238636195659637, - "train/contrastive_loss": 0.8349242806434631, - "train/negative_loss": 0.35877177119255066, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.4761525094509125, - "train/total_loss": 0.3093712329864502 + "train/classification_loss": 0.2685789167881012, + "train/contrastive_loss": 4.244009017944336, + "train/negative_loss": 2.465100049972534, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.7789090871810913, + "train/total_loss": 1.1173807382583618 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.09989036619663239, - "train/contrastive_loss": 1.578574299812317, - "train/negative_loss": 0.39708054065704346, + "train/classification_loss": 0.17535828053951263, + "train/contrastive_loss": 1.419189691543579, + "train/negative_loss": 1.1602553129196167, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 1.1814937591552734, - "train/total_loss": 0.41560524702072144 + "train/num_positives": 10, + "train/positive_loss": 0.2589344084262848, + "train/total_loss": 0.45919620990753174 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.2924329936504364, - "train/contrastive_loss": 1.5425989627838135, - "train/negative_loss": 0.31160396337509155, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.2309949398040771, - "train/total_loss": 0.6009528040885925 + "train/classification_loss": 0.21858078241348267, + "train/contrastive_loss": 3.189957618713379, + "train/negative_loss": 2.247539520263672, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.9424179792404175, + "train/total_loss": 0.8565723299980164 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.24484141170978546, - "train/contrastive_loss": 3.5462613105773926, - "train/negative_loss": 1.872650146484375, + "train/classification_loss": 0.19780108332633972, + "train/contrastive_loss": 2.1977226734161377, + "train/negative_loss": 2.1974360942840576, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.6736111640930176, - "train/total_loss": 0.9540936946868896 + "train/num_positives": 4, + "train/positive_loss": 0.000286687194602564, + "train/total_loss": 0.6373456120491028 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.15682010352611542, - "train/contrastive_loss": 3.3674654960632324, - "train/negative_loss": 2.369922399520874, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.997543215751648, - "train/total_loss": 0.8303132057189941 + "train/classification_loss": 0.18451203405857086, + "train/contrastive_loss": 0.856658935546875, + "train/negative_loss": 0.8316022753715515, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.025056643411517143, + "train/total_loss": 0.35584384202957153 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.22461089491844177, - "train/contrastive_loss": 2.4659464359283447, - "train/negative_loss": 1.0316089391708374, - "train/num_negatives": 40, + "train/classification_loss": 0.2588823437690735, + "train/contrastive_loss": 2.892712116241455, + "train/negative_loss": 1.6340378522872925, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.4343374967575073, - "train/total_loss": 0.7178001999855042 - }, - { - "epoch": 10.26615969581749, - "step": 2700, - "train/classification_loss": 0.21787135303020477, - "train/contrastive_loss": 1.6512116193771362, - "train/negative_loss": 1.3941320180892944, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.2570795714855194, - "train/total_loss": 0.5481137037277222 - }, - { - "epoch": 10.26615969581749, - "step": 2700, - "train/classification_loss": 0.15320539474487305, - "train/contrastive_loss": 2.744717836380005, - "train/negative_loss": 1.119246482849121, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 1.6254713535308838, - "train/total_loss": 0.702148973941803 + "train/positive_loss": 1.258674144744873, + "train/total_loss": 0.8374247550964355 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.22996185719966888, - "train/contrastive_loss": 2.2637557983398438, - "train/negative_loss": 0.9195767641067505, + "train/classification_loss": 0.1945541948080063, + "train/contrastive_loss": 0.9771105647087097, + "train/negative_loss": 0.9692712426185608, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.3441791534423828, - "train/total_loss": 0.6827130317687988 - }, - { - "epoch": 10.26615969581749, - "step": 2700, - "train/classification_loss": 0.2705939710140228, - "train/contrastive_loss": 1.788887858390808, - "train/negative_loss": 1.7883367538452148, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0005510775372385979, - "train/total_loss": 0.62837153673172 + "train/num_positives": 10, + "train/positive_loss": 0.007839331403374672, + "train/total_loss": 0.3899763226509094 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.17775101959705353, - "train/contrastive_loss": 1.0733227729797363, - "train/negative_loss": 0.6526709794998169, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.4206518530845642, - "train/total_loss": 0.3924155831336975 + "train/classification_loss": 0.1904030442237854, + "train/contrastive_loss": 1.8278334140777588, + "train/negative_loss": 1.5663201808929443, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.2615131735801697, + "train/total_loss": 0.5559697151184082 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.18972457945346832, - "train/contrastive_loss": 2.9098875522613525, - "train/negative_loss": 1.9580057859420776, + "train/classification_loss": 0.1648002415895462, + "train/contrastive_loss": 2.4086363315582275, + "train/negative_loss": 2.3721089363098145, "train/num_negatives": 52, "train/num_positives": 4, - "train/positive_loss": 0.9518817663192749, - "train/total_loss": 0.7717021107673645 + "train/positive_loss": 0.03652748838067055, + "train/total_loss": 0.6465275287628174 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.17952391505241394, - "train/contrastive_loss": 4.40217924118042, - "train/negative_loss": 1.5808807611465454, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 2.821298599243164, - "train/total_loss": 1.0599597692489624 + "train/classification_loss": 0.184440016746521, + "train/contrastive_loss": 2.1555018424987793, + "train/negative_loss": 1.4502166509628296, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.7052853107452393, + "train/total_loss": 0.6155403852462769 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.1387745887041092, - "train/contrastive_loss": 1.395110845565796, - "train/negative_loss": 0.6050763726234436, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.7900344133377075, - "train/total_loss": 0.417796790599823 + "train/classification_loss": 0.21587824821472168, + "train/contrastive_loss": 2.5807929039001465, + "train/negative_loss": 1.667168378829956, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.9136244654655457, + "train/total_loss": 0.732036828994751 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.1558210402727127, - "train/contrastive_loss": 0.8429834842681885, - "train/negative_loss": 0.8428046107292175, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.00017888953152578324, - "train/total_loss": 0.32441774010658264 + "train/classification_loss": 0.24265708029270172, + "train/contrastive_loss": 1.4171247482299805, + "train/negative_loss": 0.9620932340621948, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.45503151416778564, + "train/total_loss": 0.5260820388793945 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.20373140275478363, - "train/contrastive_loss": 1.1604143381118774, - "train/negative_loss": 1.0761760473251343, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.08423826098442078, - "train/total_loss": 0.4358142614364624 + "train/classification_loss": 0.14479337632656097, + "train/contrastive_loss": 2.200500249862671, + "train/negative_loss": 2.2004213333129883, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 7.887629908509552e-05, + "train/total_loss": 0.5848934054374695 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.17158479988574982, - "train/contrastive_loss": 1.7054078578948975, - "train/negative_loss": 1.7043185234069824, + "train/classification_loss": 0.1943824738264084, + "train/contrastive_loss": 1.702411413192749, + "train/negative_loss": 0.810370147228241, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.0010893315775319934, - "train/total_loss": 0.5126664042472839 + "train/num_positives": 8, + "train/positive_loss": 0.8920413255691528, + "train/total_loss": 0.5348647832870483 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.16692818701267242, - "train/contrastive_loss": 0.8309076428413391, - "train/negative_loss": 0.8028132915496826, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.02809436246752739, - "train/total_loss": 0.3331097364425659 + "train/classification_loss": 0.21114720404148102, + "train/contrastive_loss": 1.6703277826309204, + "train/negative_loss": 1.5292900800704956, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.14103767275810242, + "train/total_loss": 0.5452127456665039 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.20091387629508972, - "train/contrastive_loss": 2.537557601928711, - "train/negative_loss": 1.7493669986724854, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.7881907224655151, - "train/total_loss": 0.7084254026412964 + "train/classification_loss": 0.19728179275989532, + "train/contrastive_loss": 0.6125668883323669, + "train/negative_loss": 0.46839651465415955, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.1441703587770462, + "train/total_loss": 0.319795161485672 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.21004104614257812, - "train/contrastive_loss": 1.5795204639434814, - "train/negative_loss": 0.7047677636146545, + "train/classification_loss": 0.29019972681999207, + "train/contrastive_loss": 4.630445957183838, + "train/negative_loss": 1.6993427276611328, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.8747527003288269, - "train/total_loss": 0.5259451866149902 + "train/num_positives": 8, + "train/positive_loss": 2.931103229522705, + "train/total_loss": 1.2162889242172241 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.15193383395671844, - "train/contrastive_loss": 2.3372104167938232, - "train/negative_loss": 1.563673973083496, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.7735363841056824, - "train/total_loss": 0.6193759441375732 + "train/classification_loss": 0.1425984799861908, + "train/contrastive_loss": 1.1256687641143799, + "train/negative_loss": 0.8306665420532227, + "train/num_negatives": 46, + "train/num_positives": 10, + "train/positive_loss": 0.29500219225883484, + "train/total_loss": 0.3677322268486023 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.15757791697978973, - "train/contrastive_loss": 1.141615867614746, - "train/negative_loss": 0.3409428596496582, - "train/num_negatives": 40, + "train/classification_loss": 0.19690319895744324, + "train/contrastive_loss": 2.0265026092529297, + "train/negative_loss": 1.3792775869369507, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.8006730675697327, - "train/total_loss": 0.3859010934829712 + "train/positive_loss": 0.647225022315979, + "train/total_loss": 0.6022037267684937 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.26380619406700134, - "train/contrastive_loss": 1.5141735076904297, - "train/negative_loss": 1.175995111465454, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.3381783962249756, - "train/total_loss": 0.5666409134864807 + "train/classification_loss": 0.16565266251564026, + "train/contrastive_loss": 0.9898386597633362, + "train/negative_loss": 0.989719808101654, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.00011883485422004014, + "train/total_loss": 0.363620400428772 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.09736084938049316, - "train/contrastive_loss": 0.20844757556915283, - "train/negative_loss": 0.20844146609306335, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 6.1095061028026976e-06, - "train/total_loss": 0.13905036449432373 + "train/classification_loss": 0.275462806224823, + "train/contrastive_loss": 1.6302192211151123, + "train/negative_loss": 0.9540430307388306, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.6761762499809265, + "train/total_loss": 0.6015066504478455 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.13078874349594116, - "train/contrastive_loss": 1.1340830326080322, - "train/negative_loss": 0.41620105504989624, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.7178819179534912, - "train/total_loss": 0.35760533809661865 + "train/classification_loss": 0.16976973414421082, + "train/contrastive_loss": 2.2232112884521484, + "train/negative_loss": 2.210834264755249, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.01237698458135128, + "train/total_loss": 0.6144120097160339 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.12285593152046204, - "train/contrastive_loss": 1.3861632347106934, - "train/negative_loss": 1.091135025024414, + "train/classification_loss": 0.32502618432044983, + "train/contrastive_loss": 2.4733924865722656, + "train/negative_loss": 1.3015379905700684, "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.2950281798839569, - "train/total_loss": 0.4000885784626007 + "train/num_positives": 18, + "train/positive_loss": 1.1718544960021973, + "train/total_loss": 0.8197046518325806 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.17242969572544098, - "train/contrastive_loss": 1.0556013584136963, - "train/negative_loss": 0.4324924945831299, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.6231088042259216, - "train/total_loss": 0.3835499882698059 + "train/classification_loss": 0.17891135811805725, + "train/contrastive_loss": 3.392833948135376, + "train/negative_loss": 1.1546037197113037, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 2.2382302284240723, + "train/total_loss": 0.857478141784668 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.13811913132667542, - "train/contrastive_loss": 1.8297760486602783, - "train/negative_loss": 0.8298412561416626, + "train/classification_loss": 0.18559923768043518, + "train/contrastive_loss": 3.554265022277832, + "train/negative_loss": 2.835493326187134, "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.9999348521232605, - "train/total_loss": 0.5040743350982666 + "train/positive_loss": 0.7187715768814087, + "train/total_loss": 0.8964523077011108 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.15268731117248535, - "train/contrastive_loss": 0.4205664396286011, - "train/negative_loss": 0.41955864429473877, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.0010077808983623981, - "train/total_loss": 0.23680061101913452 + "train/classification_loss": 0.25483810901641846, + "train/contrastive_loss": 2.615293502807617, + "train/negative_loss": 2.6152801513671875, + "train/num_negatives": 48, + "train/num_positives": 2, + "train/positive_loss": 1.3232318451628089e-05, + "train/total_loss": 0.7778968214988708 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.21235650777816772, - "train/contrastive_loss": 3.477351427078247, - "train/negative_loss": 1.49769127368927, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.979660153388977, - "train/total_loss": 0.9078267812728882 + "train/classification_loss": 0.19435539841651917, + "train/contrastive_loss": 2.512592077255249, + "train/negative_loss": 0.9203905463218689, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 1.5922014713287354, + "train/total_loss": 0.6968737840652466 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.23095658421516418, - "train/contrastive_loss": 2.0823824405670166, - "train/negative_loss": 0.9203819036483765, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.1620005369186401, - "train/total_loss": 0.6474330425262451 + "train/classification_loss": 0.1328953057527542, + "train/contrastive_loss": 0.22658661007881165, + "train/negative_loss": 0.11732051521539688, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.10926608741283417, + "train/total_loss": 0.17821262776851654 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.20852893590927124, - "train/contrastive_loss": 2.5437328815460205, - "train/negative_loss": 0.6161590218544006, + "train/classification_loss": 0.19937169551849365, + "train/contrastive_loss": 1.1343051195144653, + "train/negative_loss": 1.110209345817566, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 1.927573800086975, - "train/total_loss": 0.7172755002975464 + "train/num_positives": 8, + "train/positive_loss": 0.024095721542835236, + "train/total_loss": 0.4262327253818512 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.138098806142807, - "train/contrastive_loss": 2.1247193813323975, - "train/negative_loss": 0.944364070892334, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.1803553104400635, - "train/total_loss": 0.5630427002906799 + "train/classification_loss": 0.18528319895267487, + "train/contrastive_loss": 1.4506970643997192, + "train/negative_loss": 1.4143707752227783, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.036326318979263306, + "train/total_loss": 0.47542262077331543 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.2645812928676605, - "train/contrastive_loss": 3.4152626991271973, - "train/negative_loss": 1.5373241901397705, - "train/num_negatives": 46, + "train/classification_loss": 0.3076325058937073, + "train/contrastive_loss": 3.3048787117004395, + "train/negative_loss": 1.1579900979995728, + "train/num_negatives": 36, "train/num_positives": 6, - "train/positive_loss": 1.8779386281967163, - "train/total_loss": 0.9476338624954224 + "train/positive_loss": 2.146888494491577, + "train/total_loss": 0.9686082601547241 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.22182868421077728, - "train/contrastive_loss": 3.308680534362793, - "train/negative_loss": 1.8523845672607422, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.4562959671020508, - "train/total_loss": 0.883564829826355 + "train/classification_loss": 0.13595907390117645, + "train/contrastive_loss": 0.7254592180252075, + "train/negative_loss": 0.5122767090797424, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.2131824940443039, + "train/total_loss": 0.2810509204864502 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.20286521315574646, - "train/contrastive_loss": 2.970404624938965, - "train/negative_loss": 1.1128644943237305, + "train/classification_loss": 0.11226639896631241, + "train/contrastive_loss": 0.4652174413204193, + "train/negative_loss": 0.4139293432235718, "train/num_negatives": 34, "train/num_positives": 22, - "train/positive_loss": 1.8575401306152344, - "train/total_loss": 0.7969461679458618 + "train/positive_loss": 0.05128810182213783, + "train/total_loss": 0.2053098976612091 + }, + { + "epoch": 9.507042253521126, + "step": 2700, + "train/classification_loss": 0.1604146659374237, + "train/contrastive_loss": 2.3324451446533203, + "train/negative_loss": 1.2000235319137573, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.1324217319488525, + "train/total_loss": 0.6269037127494812 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.2126314789056778, - "train/contrastive_loss": 4.017848491668701, - "train/negative_loss": 1.724530816078186, + "train/classification_loss": 0.2118668407201767, + "train/contrastive_loss": 3.014366626739502, + "train/negative_loss": 1.657504916191101, "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.3568618297576904, + "train/total_loss": 0.8147401809692383 + }, + { + "epoch": 9.507042253521126, + "step": 2700, + "train/classification_loss": 0.18209993839263916, + "train/contrastive_loss": 0.9660111665725708, + "train/negative_loss": 0.7024995684623718, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.26351162791252136, + "train/total_loss": 0.37530219554901123 + }, + { + "epoch": 9.507042253521126, + "step": 2700, + "train/classification_loss": 0.11673104017972946, + "train/contrastive_loss": 0.6742532253265381, + "train/negative_loss": 0.40294432640075684, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.27130889892578125, + "train/total_loss": 0.25158169865608215 + }, + { + "epoch": 9.507042253521126, + "step": 2700, + "train/classification_loss": 0.19410599768161774, + "train/contrastive_loss": 2.5448427200317383, + "train/negative_loss": 1.4728997945785522, + "train/num_negatives": 40, "train/num_positives": 10, - "train/positive_loss": 2.2933175563812256, - "train/total_loss": 1.0162012577056885 + "train/positive_loss": 1.0719430446624756, + "train/total_loss": 0.7030745148658752 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.21603676676750183, - "train/contrastive_loss": 1.9913511276245117, - "train/negative_loss": 1.0470718145370483, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.9442792534828186, - "train/total_loss": 0.6143069863319397 + "train/classification_loss": 0.255287766456604, + "train/contrastive_loss": 1.4933267831802368, + "train/negative_loss": 1.1634098291397095, + "train/num_negatives": 46, + "train/num_positives": 2, + "train/positive_loss": 0.32991698384284973, + "train/total_loss": 0.5539531707763672 + }, + { + "epoch": 9.507042253521126, + "step": 2700, + "train/classification_loss": 0.13877858221530914, + "train/contrastive_loss": 1.856605887413025, + "train/negative_loss": 1.4671188592910767, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.38948702812194824, + "train/total_loss": 0.5100997686386108 + }, + { + "epoch": 9.507042253521126, + "step": 2700, + "train/classification_loss": 0.1751866638660431, + "train/contrastive_loss": 0.5172592401504517, + "train/negative_loss": 0.45144206285476685, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.0658172070980072, + "train/total_loss": 0.2786385118961334 + }, + { + "epoch": 9.507042253521126, + "step": 2700, + "train/classification_loss": 0.16447676718235016, + "train/contrastive_loss": 1.8310130834579468, + "train/negative_loss": 0.4243212640285492, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 1.4066917896270752, + "train/total_loss": 0.5306794047355652 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.2537527084350586, - "train/contrastive_loss": 3.335238456726074, - "train/negative_loss": 1.3512930870056152, + "train/classification_loss": 0.16225150227546692, + "train/contrastive_loss": 4.991938591003418, + "train/negative_loss": 4.991936683654785, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 1.9431149667070713e-06, + "train/total_loss": 1.1606392860412598 + }, + { + "epoch": 9.507042253521126, + "step": 2700, + "train/classification_loss": 0.1687004566192627, + "train/contrastive_loss": 1.6625807285308838, + "train/negative_loss": 0.4287572503089905, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.9839454889297485, - "train/total_loss": 0.9208003878593445 + "train/positive_loss": 1.233823537826538, + "train/total_loss": 0.5012166500091553 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.1678508073091507, - "train/contrastive_loss": 0.8432839512825012, - "train/negative_loss": 0.8430501222610474, + "train/classification_loss": 0.21064788103103638, + "train/contrastive_loss": 2.6139304637908936, + "train/negative_loss": 2.035810947418213, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.0002338238264201209, - "train/total_loss": 0.3365076184272766 + "train/num_positives": 8, + "train/positive_loss": 0.5781194567680359, + "train/total_loss": 0.7334339618682861 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.17522963881492615, - "train/contrastive_loss": 1.4549951553344727, - "train/negative_loss": 1.02342689037323, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.43156829476356506, - "train/total_loss": 0.4662286639213562 + "train/classification_loss": 0.1537582129240036, + "train/contrastive_loss": 1.8837095499038696, + "train/negative_loss": 0.9978513121604919, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.8858582377433777, + "train/total_loss": 0.5305001139640808 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.13671547174453735, - "train/contrastive_loss": 0.7889689207077026, - "train/negative_loss": 0.4190372824668884, - "train/num_negatives": 46, + "train/classification_loss": 0.2564479112625122, + "train/contrastive_loss": 1.8451323509216309, + "train/negative_loss": 1.3986173868179321, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.3699316382408142, - "train/total_loss": 0.29450926184654236 + "train/positive_loss": 0.44651490449905396, + "train/total_loss": 0.6254743933677673 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.20973829925060272, - "train/contrastive_loss": 1.8284860849380493, - "train/negative_loss": 1.8284860849380493, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5754355192184448 - }, - { - "epoch": 10.26615969581749, - "eval_exact_match_accuracy": 0.29523809523809524, - "eval_hamming_loss": 0.06767507002801121, - "eval_loss": 0.6086791753768921, - "eval_macro_f1": 0.35107541860645014, - "eval_macro_precision": 0.5374331691716865, - "eval_macro_recall": 0.27829387129774075, - "eval_micro_f1": 0.5545722713864307, - "eval_micro_precision": 0.7882599580712788, - "eval_micro_recall": 0.42775881683731515, - "eval_runtime": 2.6351, - "eval_samples_per_second": 199.231, - "eval_steps_per_second": 25.046, + "train/classification_loss": 0.18230153620243073, + "train/contrastive_loss": 1.692655324935913, + "train/negative_loss": 1.628920078277588, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.06373518705368042, + "train/total_loss": 0.5208325982093811 + }, + { + "epoch": 9.507042253521126, + "eval_exact_match_accuracy": 0.2786596119929453, + "eval_hamming_loss": 0.07127295362589481, + "eval_loss": 0.5910915732383728, + "eval_macro_f1": 0.3399007092993409, + "eval_macro_precision": 0.560983161895091, + "eval_macro_recall": 0.26820156138559786, + "eval_micro_f1": 0.5178947368421053, + "eval_micro_precision": 0.757700205338809, + "eval_micro_recall": 0.39339019189765456, + "eval_runtime": 2.8413, + "eval_samples_per_second": 199.56, + "eval_steps_per_second": 24.989, "step": 2700 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.15328989923000336, - "train/contrastive_loss": 0.36967015266418457, - "train/negative_loss": 0.2904798090457916, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.07919035106897354, - "train/total_loss": 0.2272239327430725 + "train/classification_loss": 0.12901562452316284, + "train/contrastive_loss": 0.8175753951072693, + "train/negative_loss": 0.8139306902885437, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.003644683165475726, + "train/total_loss": 0.29253071546554565 }, { - "epoch": 10.26615969581749, + "epoch": 9.507042253521126, "step": 2700, - "train/classification_loss": 0.13309869170188904, - "train/contrastive_loss": 0.26945561170578003, - "train/negative_loss": 0.24946275353431702, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.019992846995592117, - "train/total_loss": 0.18698981404304504 + "train/classification_loss": 0.15829998254776, + "train/contrastive_loss": 1.8234858512878418, + "train/negative_loss": 1.3036770820617676, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.5198087096214294, + "train/total_loss": 0.5229971408843994 }, { - "epoch": 10.456273764258555, - "grad_norm": 4.659131050109863, - "learning_rate": 1.959710806697108e-05, - "loss": 0.6042, + "epoch": 9.683098591549296, + "grad_norm": 9.153973579406738, + "learning_rate": 1.9627061310782244e-05, + "loss": 0.6411, "step": 2750 }, { - "epoch": 10.456273764258555, + "epoch": 9.683098591549296, "step": 2750, - "train/classification_loss": 0.14212600886821747, - "train/contrastive_loss": 1.5235724449157715, - "train/negative_loss": 0.6297898888587952, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.8937826156616211, - "train/total_loss": 0.4468405246734619 + "train/classification_loss": 0.11858583986759186, + "train/contrastive_loss": 0.4542088508605957, + "train/negative_loss": 0.40345609188079834, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.050752751529216766, + "train/total_loss": 0.209427610039711 }, { - "epoch": 10.456273764258555, + "epoch": 9.683098591549296, "step": 2750, - "train/classification_loss": 0.06530577689409256, - "train/contrastive_loss": 0.3175392150878906, - "train/negative_loss": 0.22487445175647736, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.09266476333141327, - "train/total_loss": 0.12881362438201904 + "train/classification_loss": 0.08259477466344833, + "train/contrastive_loss": 0.3632351756095886, + "train/negative_loss": 0.35160335898399353, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.011631814762949944, + "train/total_loss": 0.15524181723594666 }, { - "epoch": 10.64638783269962, - "grad_norm": 8.040148735046387, - "learning_rate": 1.958949771689498e-05, - "loss": 0.625, + "epoch": 9.859154929577464, + "grad_norm": 10.849760055541992, + "learning_rate": 1.96200140944327e-05, + "loss": 0.6916, "step": 2800 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.2743460237979889, - "train/contrastive_loss": 2.4521713256835938, - "train/negative_loss": 1.080503225326538, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.3716679811477661, - "train/total_loss": 0.7647802829742432 + "train/classification_loss": 0.2422458976507187, + "train/contrastive_loss": 1.721174716949463, + "train/negative_loss": 1.2936679124832153, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.4275067448616028, + "train/total_loss": 0.5864808559417725 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.19949500262737274, - "train/contrastive_loss": 2.2236320972442627, - "train/negative_loss": 1.0917623043060303, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 1.1318697929382324, - "train/total_loss": 0.6442214250564575 + "train/classification_loss": 0.2578805983066559, + "train/contrastive_loss": 0.9033896923065186, + "train/negative_loss": 0.4029536247253418, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.5004360675811768, + "train/total_loss": 0.43855851888656616 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.18048112094402313, - "train/contrastive_loss": 2.1225266456604004, - "train/negative_loss": 0.8695245385169983, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.2530021667480469, - "train/total_loss": 0.6049864292144775 + "train/classification_loss": 0.2397628128528595, + "train/contrastive_loss": 2.841975450515747, + "train/negative_loss": 1.3694028854370117, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.4725725650787354, + "train/total_loss": 0.8081579208374023 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.2560392916202545, - "train/contrastive_loss": 3.600142002105713, - "train/negative_loss": 1.7765650749206543, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.8235770463943481, - "train/total_loss": 0.9760676622390747 + "train/classification_loss": 0.14542058110237122, + "train/contrastive_loss": 2.0952982902526855, + "train/negative_loss": 1.056650161743164, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 1.038648247718811, + "train/total_loss": 0.5644802451133728 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.10946256667375565, - "train/contrastive_loss": 1.5924628973007202, - "train/negative_loss": 1.0481618642807007, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.5443010330200195, - "train/total_loss": 0.42795515060424805 + "train/classification_loss": 0.1968403160572052, + "train/contrastive_loss": 2.0891003608703613, + "train/negative_loss": 1.5229990482330322, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.5661011934280396, + "train/total_loss": 0.614660382270813 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.18927739560604095, - "train/contrastive_loss": 2.564500331878662, - "train/negative_loss": 1.333172082901001, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 1.2313281297683716, - "train/total_loss": 0.7021774649620056 + "train/classification_loss": 0.19998688995838165, + "train/contrastive_loss": 2.3039064407348633, + "train/negative_loss": 1.2318562269210815, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 1.0720502138137817, + "train/total_loss": 0.6607682108879089 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.20733225345611572, - "train/contrastive_loss": 1.2982125282287598, - "train/negative_loss": 1.0468738079071045, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.2513386905193329, - "train/total_loss": 0.46697476506233215 + "train/classification_loss": 0.17715367674827576, + "train/contrastive_loss": 1.472278356552124, + "train/negative_loss": 0.7979770302772522, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.674301266670227, + "train/total_loss": 0.47160935401916504 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.16422389447689056, - "train/contrastive_loss": 2.1302523612976074, - "train/negative_loss": 1.4930636882781982, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.6371886134147644, - "train/total_loss": 0.5902743935585022 + "train/classification_loss": 0.18147341907024384, + "train/contrastive_loss": 0.7004166841506958, + "train/negative_loss": 0.6988470554351807, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 0.0015696082264184952, + "train/total_loss": 0.3215567469596863 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.15678644180297852, - "train/contrastive_loss": 1.3415343761444092, - "train/negative_loss": 1.3006476163864136, + "train/classification_loss": 0.10392995178699493, + "train/contrastive_loss": 0.953577995300293, + "train/negative_loss": 0.30992963910102844, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.04088672995567322, - "train/total_loss": 0.42509332299232483 + "train/positive_loss": 0.6436483860015869, + "train/total_loss": 0.2946455478668213 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.3226388394832611, - "train/contrastive_loss": 3.4809250831604004, - "train/negative_loss": 1.5914385318756104, + "train/classification_loss": 0.18369993567466736, + "train/contrastive_loss": 2.3295676708221436, + "train/negative_loss": 1.3953849077224731, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.8894864320755005, - "train/total_loss": 1.0188238620758057 + "train/num_positives": 14, + "train/positive_loss": 0.9341827630996704, + "train/total_loss": 0.6496134996414185 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.1899259239435196, - "train/contrastive_loss": 2.7843027114868164, - "train/negative_loss": 1.6598905324935913, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 1.1244120597839355, - "train/total_loss": 0.7467864751815796 + "train/classification_loss": 0.1467398703098297, + "train/contrastive_loss": 1.3287410736083984, + "train/negative_loss": 0.6292564868927002, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.6994845271110535, + "train/total_loss": 0.41248810291290283 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.11051826179027557, - "train/contrastive_loss": 1.289538025856018, - "train/negative_loss": 0.3353061378002167, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.9542319178581238, - "train/total_loss": 0.3684258460998535 + "train/classification_loss": 0.16137251257896423, + "train/contrastive_loss": 1.925856113433838, + "train/negative_loss": 1.0077437162399292, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.9181124567985535, + "train/total_loss": 0.5465437173843384 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.16975590586662292, - "train/contrastive_loss": 3.1306605339050293, - "train/negative_loss": 1.9896279573440552, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.1410324573516846, - "train/total_loss": 0.7958880662918091 + "train/classification_loss": 0.20013026893138885, + "train/contrastive_loss": 3.637685775756836, + "train/negative_loss": 1.4786475896835327, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 2.1590380668640137, + "train/total_loss": 0.9276674389839172 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.11393450200557709, - "train/contrastive_loss": 2.18772292137146, - "train/negative_loss": 2.187692880630493, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 3.002705125254579e-05, - "train/total_loss": 0.5514791011810303 + "train/classification_loss": 0.16525375843048096, + "train/contrastive_loss": 1.4299119710922241, + "train/negative_loss": 0.6464141607284546, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.7834978103637695, + "train/total_loss": 0.45123615860939026 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.11091789603233337, - "train/contrastive_loss": 1.2975338697433472, - "train/negative_loss": 1.0956522226333618, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.20188164710998535, - "train/total_loss": 0.37042468786239624 + "train/classification_loss": 0.14059491455554962, + "train/contrastive_loss": 3.1143014430999756, + "train/negative_loss": 0.7113563418388367, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 2.402945041656494, + "train/total_loss": 0.7634552121162415 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.14840707182884216, - "train/contrastive_loss": 0.9892300367355347, - "train/negative_loss": 0.43263545632362366, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.5565945506095886, - "train/total_loss": 0.34625309705734253 + "train/classification_loss": 0.15830004215240479, + "train/contrastive_loss": 1.034705400466919, + "train/negative_loss": 0.2746495008468628, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.7600558996200562, + "train/total_loss": 0.3652411103248596 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.24186818301677704, - "train/contrastive_loss": 2.391366481781006, - "train/negative_loss": 1.423585295677185, - "train/num_negatives": 40, + "train/classification_loss": 0.12019146233797073, + "train/contrastive_loss": 1.1123141050338745, + "train/negative_loss": 0.4054318368434906, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.9677812457084656, - "train/total_loss": 0.7201414704322815 + "train/positive_loss": 0.7068822383880615, + "train/total_loss": 0.342654287815094 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.1676045060157776, - "train/contrastive_loss": 2.058641195297241, - "train/negative_loss": 0.4846593737602234, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 1.573981761932373, - "train/total_loss": 0.579332709312439 + "train/classification_loss": 0.19889847934246063, + "train/contrastive_loss": 1.3846909999847412, + "train/negative_loss": 0.5369450449943542, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.8477458953857422, + "train/total_loss": 0.47583669424057007 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.1830926388502121, - "train/contrastive_loss": 1.6482425928115845, - "train/negative_loss": 1.6384726762771606, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.009769903495907784, - "train/total_loss": 0.5127411484718323 + "train/classification_loss": 0.14434264600276947, + "train/contrastive_loss": 0.9681116342544556, + "train/negative_loss": 0.36274853348731995, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.6053630709648132, + "train/total_loss": 0.3379649817943573 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.15745943784713745, - "train/contrastive_loss": 2.143280267715454, - "train/negative_loss": 1.9277174472808838, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.2155628651380539, - "train/total_loss": 0.5861154794692993 + "train/classification_loss": 0.21232929825782776, + "train/contrastive_loss": 3.307300090789795, + "train/negative_loss": 1.3321508169174194, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.975149393081665, + "train/total_loss": 0.8737893104553223 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.2022472769021988, - "train/contrastive_loss": 1.673172950744629, - "train/negative_loss": 0.3006562888622284, - "train/num_negatives": 44, + "train/classification_loss": 0.1258581280708313, + "train/contrastive_loss": 1.1267513036727905, + "train/negative_loss": 1.114208459854126, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.3725166320800781, - "train/total_loss": 0.5368818640708923 + "train/positive_loss": 0.0125428456813097, + "train/total_loss": 0.3512083888053894 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.2391534447669983, - "train/contrastive_loss": 1.8717283010482788, - "train/negative_loss": 0.94361811876297, - "train/num_negatives": 44, + "train/classification_loss": 0.13371552526950836, + "train/contrastive_loss": 2.8056769371032715, + "train/negative_loss": 1.911933422088623, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.9281101822853088, - "train/total_loss": 0.613499104976654 + "train/positive_loss": 0.893743634223938, + "train/total_loss": 0.6948509216308594 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.154268279671669, - "train/contrastive_loss": 1.855112075805664, - "train/negative_loss": 0.5767446160316467, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 1.278367519378662, - "train/total_loss": 0.5252907276153564 + "train/classification_loss": 0.13864447176456451, + "train/contrastive_loss": 1.1586953401565552, + "train/negative_loss": 0.8028740286827087, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.3558213412761688, + "train/total_loss": 0.3703835606575012 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.130403071641922, - "train/contrastive_loss": 0.27666300535202026, - "train/negative_loss": 0.20003899931907654, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.07662402093410492, - "train/total_loss": 0.18573567271232605 + "train/classification_loss": 0.2527272403240204, + "train/contrastive_loss": 3.6967899799346924, + "train/negative_loss": 1.8888001441955566, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.8079898357391357, + "train/total_loss": 0.9920852184295654 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.08703843504190445, - "train/contrastive_loss": 0.6127451658248901, - "train/negative_loss": 0.27566424012184143, + "train/classification_loss": 0.16538181900978088, + "train/contrastive_loss": 2.630919933319092, + "train/negative_loss": 0.9302123188972473, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.3370809257030487, - "train/total_loss": 0.2095874696969986 + "train/num_positives": 10, + "train/positive_loss": 1.7007076740264893, + "train/total_loss": 0.6915658712387085 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.28658702969551086, - "train/contrastive_loss": 1.9837487936019897, - "train/negative_loss": 0.49645426869392395, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.4872945547103882, - "train/total_loss": 0.6833367943763733 + "train/classification_loss": 0.23373982310295105, + "train/contrastive_loss": 2.723788261413574, + "train/negative_loss": 1.5791181325912476, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.144670009613037, + "train/total_loss": 0.7784974575042725 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.27034831047058105, - "train/contrastive_loss": 4.045159816741943, - "train/negative_loss": 1.5790975093841553, + "train/classification_loss": 0.19584132730960846, + "train/contrastive_loss": 2.3939971923828125, + "train/negative_loss": 2.336350679397583, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 2.466062307357788, - "train/total_loss": 1.0793802738189697 + "train/num_positives": 4, + "train/positive_loss": 0.05764659866690636, + "train/total_loss": 0.6746407747268677 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.1516323685646057, - "train/contrastive_loss": 2.2811295986175537, - "train/negative_loss": 1.914392352104187, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.3667373061180115, - "train/total_loss": 0.6078583002090454 + "train/classification_loss": 0.1803833544254303, + "train/contrastive_loss": 0.295193076133728, + "train/negative_loss": 0.2837584912776947, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.011434579268097878, + "train/total_loss": 0.23942196369171143 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.18720626831054688, - "train/contrastive_loss": 1.7073228359222412, - "train/negative_loss": 1.0633283853530884, - "train/num_negatives": 40, + "train/classification_loss": 0.2578928470611572, + "train/contrastive_loss": 2.998237371444702, + "train/negative_loss": 1.3674235343933105, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.6439944505691528, - "train/total_loss": 0.5286708474159241 - }, - { - "epoch": 10.64638783269962, - "step": 2800, - "train/classification_loss": 0.21393060684204102, - "train/contrastive_loss": 1.1746633052825928, - "train/negative_loss": 0.6158263087272644, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.5588369369506836, - "train/total_loss": 0.44886326789855957 - }, - { - "epoch": 10.64638783269962, - "step": 2800, - "train/classification_loss": 0.15971742570400238, - "train/contrastive_loss": 3.992135763168335, - "train/negative_loss": 2.0191516876220703, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 1.9729840755462646, - "train/total_loss": 0.9581446051597595 + "train/positive_loss": 1.6308138370513916, + "train/total_loss": 0.8575403094291687 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.22860898077487946, - "train/contrastive_loss": 2.165438652038574, - "train/negative_loss": 1.2979649305343628, + "train/classification_loss": 0.17316599190235138, + "train/contrastive_loss": 0.3680519461631775, + "train/negative_loss": 0.3675346076488495, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.8674737811088562, - "train/total_loss": 0.66169673204422 + "train/num_positives": 10, + "train/positive_loss": 0.0005173303070478141, + "train/total_loss": 0.24677637219429016 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.25656330585479736, - "train/contrastive_loss": 1.0426108837127686, - "train/negative_loss": 1.0413569211959839, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0012539138551801443, - "train/total_loss": 0.465085506439209 + "train/classification_loss": 0.16192907094955444, + "train/contrastive_loss": 1.2288349866867065, + "train/negative_loss": 0.8368066549301147, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.3920283615589142, + "train/total_loss": 0.40769606828689575 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.16843868792057037, - "train/contrastive_loss": 0.6748702526092529, - "train/negative_loss": 0.6665011048316956, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.00836913287639618, - "train/total_loss": 0.3034127354621887 + "train/classification_loss": 0.1536184400320053, + "train/contrastive_loss": 1.9579675197601318, + "train/negative_loss": 1.2453473806381226, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.7126200795173645, + "train/total_loss": 0.5452119708061218 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.2194138914346695, - "train/contrastive_loss": 4.084502220153809, - "train/negative_loss": 2.645690441131592, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.4388117790222168, - "train/total_loss": 1.0363143682479858 + "train/classification_loss": 0.17546148598194122, + "train/contrastive_loss": 1.2615089416503906, + "train/negative_loss": 0.624224841594696, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.6372841596603394, + "train/total_loss": 0.42776328325271606 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.18862828612327576, - "train/contrastive_loss": 4.481968879699707, - "train/negative_loss": 1.802842378616333, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 2.679126501083374, - "train/total_loss": 1.0850220918655396 + "train/classification_loss": 0.2133786827325821, + "train/contrastive_loss": 2.3824925422668457, + "train/negative_loss": 1.7685984373092651, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.6138941049575806, + "train/total_loss": 0.6898772120475769 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.1548377275466919, - "train/contrastive_loss": 1.3898818492889404, - "train/negative_loss": 0.49772509932518005, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.8921567797660828, - "train/total_loss": 0.4328140914440155 + "train/classification_loss": 0.2253674566745758, + "train/contrastive_loss": 1.4370590448379517, + "train/negative_loss": 0.9245150685310364, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.5125439763069153, + "train/total_loss": 0.5127792358398438 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.1783551126718521, - "train/contrastive_loss": 1.8974989652633667, - "train/negative_loss": 0.8661391735076904, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 1.0313597917556763, - "train/total_loss": 0.5578548908233643 + "train/classification_loss": 0.13447359204292297, + "train/contrastive_loss": 1.8005852699279785, + "train/negative_loss": 1.800480604171753, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.00010467678657732904, + "train/total_loss": 0.4945906400680542 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.1987002193927765, - "train/contrastive_loss": 1.5245217084884644, - "train/negative_loss": 1.462691068649292, + "train/classification_loss": 0.19570650160312653, + "train/contrastive_loss": 1.7497758865356445, + "train/negative_loss": 0.5966654419898987, "train/num_negatives": 46, "train/num_positives": 8, - "train/positive_loss": 0.061830632388591766, - "train/total_loss": 0.503604531288147 + "train/positive_loss": 1.153110384941101, + "train/total_loss": 0.5456616878509521 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.17946648597717285, - "train/contrastive_loss": 1.9489930868148804, - "train/negative_loss": 1.9477403163909912, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.0012527202488854527, - "train/total_loss": 0.5692651271820068 + "train/classification_loss": 0.2233089953660965, + "train/contrastive_loss": 2.3549704551696777, + "train/negative_loss": 2.2732763290405273, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.0816941112279892, + "train/total_loss": 0.6943030953407288 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.18922129273414612, - "train/contrastive_loss": 2.079664707183838, - "train/negative_loss": 1.0002127885818481, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.0794520378112793, - "train/total_loss": 0.605154275894165 + "train/classification_loss": 0.2193119078874588, + "train/contrastive_loss": 1.410846471786499, + "train/negative_loss": 0.5325482487678528, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.8782982230186462, + "train/total_loss": 0.5014812350273132 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.18284469842910767, - "train/contrastive_loss": 2.533952236175537, - "train/negative_loss": 2.0142605304718018, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.5196918249130249, - "train/total_loss": 0.689635157585144 + "train/classification_loss": 0.2568223774433136, + "train/contrastive_loss": 4.215339660644531, + "train/negative_loss": 1.7484999895095825, + "train/num_negatives": 42, + "train/num_positives": 8, + "train/positive_loss": 2.4668397903442383, + "train/total_loss": 1.0998903512954712 + }, + { + "epoch": 9.859154929577464, + "step": 2800, + "train/classification_loss": 0.14489434659481049, + "train/contrastive_loss": 1.600229024887085, + "train/negative_loss": 0.7183215022087097, + "train/num_negatives": 46, + "train/num_positives": 10, + "train/positive_loss": 0.8819074630737305, + "train/total_loss": 0.4649401307106018 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.1999458521604538, - "train/contrastive_loss": 1.1343432664871216, - "train/negative_loss": 0.4284712076187134, + "train/classification_loss": 0.19604523479938507, + "train/contrastive_loss": 3.19573974609375, + "train/negative_loss": 1.3959224224090576, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.7058720588684082, - "train/total_loss": 0.4268144965171814 + "train/num_positives": 14, + "train/positive_loss": 1.7998173236846924, + "train/total_loss": 0.8351931571960449 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.14183597266674042, - "train/contrastive_loss": 2.0958406925201416, - "train/negative_loss": 1.350545883178711, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.7452948093414307, - "train/total_loss": 0.561004102230072 + "train/classification_loss": 0.15760312974452972, + "train/contrastive_loss": 0.4566722810268402, + "train/negative_loss": 0.45651084184646606, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.00016143334505613893, + "train/total_loss": 0.24893757700920105 + }, + { + "epoch": 9.859154929577464, + "step": 2800, + "train/classification_loss": 0.23440247774124146, + "train/contrastive_loss": 0.9202690124511719, + "train/negative_loss": 0.6256960034370422, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.29457297921180725, + "train/total_loss": 0.4184562861919403 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.1456291526556015, - "train/contrastive_loss": 0.90718674659729, - "train/negative_loss": 0.5129501223564148, + "train/classification_loss": 0.18507640063762665, + "train/contrastive_loss": 2.756464719772339, + "train/negative_loss": 2.0327699184417725, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.39423662424087524, - "train/total_loss": 0.3270665109157562 + "train/num_positives": 12, + "train/positive_loss": 0.7236948013305664, + "train/total_loss": 0.7363693714141846 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.27910155057907104, - "train/contrastive_loss": 2.273566961288452, - "train/negative_loss": 1.073786735534668, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 1.1997802257537842, - "train/total_loss": 0.7338149547576904 + "train/classification_loss": 0.3184349834918976, + "train/contrastive_loss": 1.9404232501983643, + "train/negative_loss": 0.8505808115005493, + "train/num_negatives": 30, + "train/num_positives": 18, + "train/positive_loss": 1.089842438697815, + "train/total_loss": 0.706519603729248 + }, + { + "epoch": 9.859154929577464, + "step": 2800, + "train/classification_loss": 0.15520323812961578, + "train/contrastive_loss": 2.6822690963745117, + "train/negative_loss": 0.999466061592102, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.6828030347824097, + "train/total_loss": 0.6916570663452148 + }, + { + "epoch": 9.859154929577464, + "step": 2800, + "train/classification_loss": 0.18790845572948456, + "train/contrastive_loss": 2.603407859802246, + "train/negative_loss": 2.186038017272949, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.4173697233200073, + "train/total_loss": 0.708590030670166 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.10662133991718292, - "train/contrastive_loss": 0.9300322532653809, - "train/negative_loss": 0.9300276041030884, + "train/classification_loss": 0.26583942770957947, + "train/contrastive_loss": 2.217435121536255, + "train/negative_loss": 2.2174315452575684, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 4.6491795728798024e-06, - "train/total_loss": 0.29262781143188477 + "train/num_positives": 2, + "train/positive_loss": 3.57628505298635e-06, + "train/total_loss": 0.709326446056366 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.11402805894613266, - "train/contrastive_loss": 0.21971988677978516, - "train/negative_loss": 0.21856659650802612, - "train/num_negatives": 38, + "train/classification_loss": 0.2037402093410492, + "train/contrastive_loss": 2.2504491806030273, + "train/negative_loss": 1.1650561094284058, + "train/num_negatives": 40, "train/num_positives": 16, - "train/positive_loss": 0.0011532960925251245, - "train/total_loss": 0.1579720377922058 + "train/positive_loss": 1.0853931903839111, + "train/total_loss": 0.6538300514221191 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.09192099422216415, - "train/contrastive_loss": 0.8380711078643799, - "train/negative_loss": 0.8364946246147156, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.0015764966374263167, - "train/total_loss": 0.2595352232456207 + "train/classification_loss": 0.1263217329978943, + "train/contrastive_loss": 0.14254340529441833, + "train/negative_loss": 0.08723662793636322, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.05530676990747452, + "train/total_loss": 0.15483041107654572 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.1741214394569397, - "train/contrastive_loss": 1.2754836082458496, - "train/negative_loss": 1.0051844120025635, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.2702992558479309, - "train/total_loss": 0.4292181730270386 + "train/classification_loss": 0.19413205981254578, + "train/contrastive_loss": 0.9580098986625671, + "train/negative_loss": 0.7995215058326721, + "train/num_negatives": 40, + "train/num_positives": 8, + "train/positive_loss": 0.15848837792873383, + "train/total_loss": 0.38573402166366577 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.14051669836044312, - "train/contrastive_loss": 2.173161745071411, - "train/negative_loss": 1.2408487796783447, - "train/num_negatives": 42, + "train/classification_loss": 0.1995437741279602, + "train/contrastive_loss": 1.3031272888183594, + "train/negative_loss": 1.10425865650177, + "train/num_negatives": 38, "train/num_positives": 14, - "train/positive_loss": 0.9323130249977112, - "train/total_loss": 0.5751490592956543 + "train/positive_loss": 0.19886858761310577, + "train/total_loss": 0.4601692259311676 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.14948849380016327, - "train/contrastive_loss": 0.4013515114784241, - "train/negative_loss": 0.393065869808197, - "train/num_negatives": 50, + "train/classification_loss": 0.3115212023258209, + "train/contrastive_loss": 2.1659932136535645, + "train/negative_loss": 1.0569956302642822, + "train/num_negatives": 36, "train/num_positives": 6, - "train/positive_loss": 0.008285634219646454, - "train/total_loss": 0.22975879907608032 + "train/positive_loss": 1.1089975833892822, + "train/total_loss": 0.7447198629379272 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.18970680236816406, - "train/contrastive_loss": 1.7480924129486084, - "train/negative_loss": 0.9232333898544312, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.824859082698822, - "train/total_loss": 0.5393252968788147 + "train/classification_loss": 0.13202039897441864, + "train/contrastive_loss": 0.6856703758239746, + "train/negative_loss": 0.4037132263183594, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.28195711970329285, + "train/total_loss": 0.26915448904037476 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.24652916193008423, - "train/contrastive_loss": 2.8718438148498535, - "train/negative_loss": 1.9531532526016235, + "train/classification_loss": 0.13055665791034698, + "train/contrastive_loss": 0.8618555665016174, + "train/negative_loss": 0.422348290681839, "train/num_negatives": 34, "train/num_positives": 22, - "train/positive_loss": 0.91869056224823, - "train/total_loss": 0.8208979368209839 + "train/positive_loss": 0.43950727581977844, + "train/total_loss": 0.30292779207229614 + }, + { + "epoch": 9.859154929577464, + "step": 2800, + "train/classification_loss": 0.15074796974658966, + "train/contrastive_loss": 1.8078230619430542, + "train/negative_loss": 0.6606121063232422, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.147210955619812, + "train/total_loss": 0.5123125910758972 + }, + { + "epoch": 9.859154929577464, + "step": 2800, + "train/classification_loss": 0.189544677734375, + "train/contrastive_loss": 2.6949150562286377, + "train/negative_loss": 1.2093682289123535, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.4855468273162842, + "train/total_loss": 0.7285277247428894 + }, + { + "epoch": 9.859154929577464, + "step": 2800, + "train/classification_loss": 0.1958393156528473, + "train/contrastive_loss": 1.5279107093811035, + "train/negative_loss": 0.6890113353729248, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.8388993144035339, + "train/total_loss": 0.5014214515686035 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.17346300184726715, - "train/contrastive_loss": 0.7914299964904785, - "train/negative_loss": 0.42296767234802246, + "train/classification_loss": 0.09453032165765762, + "train/contrastive_loss": 0.47734537720680237, + "train/negative_loss": 0.1615724265575409, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.36846235394477844, - "train/total_loss": 0.3317490220069885 + "train/num_positives": 16, + "train/positive_loss": 0.3157729506492615, + "train/total_loss": 0.18999940156936646 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.15819025039672852, - "train/contrastive_loss": 2.3373260498046875, - "train/negative_loss": 1.0983611345291138, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.2389650344848633, - "train/total_loss": 0.625655472278595 + "train/classification_loss": 0.19003990292549133, + "train/contrastive_loss": 2.1613221168518066, + "train/negative_loss": 1.2775293588638306, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 0.8837928771972656, + "train/total_loss": 0.6223043203353882 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.2528201639652252, - "train/contrastive_loss": 4.336633682250977, - "train/negative_loss": 1.2842013835906982, + "train/classification_loss": 0.250262051820755, + "train/contrastive_loss": 1.6377253532409668, + "train/negative_loss": 0.8702628016471863, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 3.052432060241699, - "train/total_loss": 1.1201468706130981 + "train/num_positives": 2, + "train/positive_loss": 0.7674626111984253, + "train/total_loss": 0.5778071284294128 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.2121557593345642, - "train/contrastive_loss": 3.4576375484466553, - "train/negative_loss": 1.599273681640625, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.8583638668060303, - "train/total_loss": 0.9036833047866821 + "train/classification_loss": 0.14335666596889496, + "train/contrastive_loss": 1.5191998481750488, + "train/negative_loss": 0.9416450262069702, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.5775548219680786, + "train/total_loss": 0.4471966624259949 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.191873237490654, - "train/contrastive_loss": 2.541205406188965, - "train/negative_loss": 1.2708439826965332, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.270361304283142, - "train/total_loss": 0.700114369392395 + "train/classification_loss": 0.20338916778564453, + "train/contrastive_loss": 0.7640072703361511, + "train/negative_loss": 0.5475155711174011, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.2164916843175888, + "train/total_loss": 0.35619062185287476 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.22249889373779297, - "train/contrastive_loss": 4.224816799163818, - "train/negative_loss": 1.83634614944458, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 2.3884706497192383, - "train/total_loss": 1.0674622058868408 + "train/classification_loss": 0.17595137655735016, + "train/contrastive_loss": 2.362671375274658, + "train/negative_loss": 0.6120171546936035, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 1.7506542205810547, + "train/total_loss": 0.6484856605529785 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.22678980231285095, - "train/contrastive_loss": 3.0392181873321533, - "train/negative_loss": 2.288062572479248, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.75115567445755, - "train/total_loss": 0.834633469581604 + "train/classification_loss": 0.16194500029087067, + "train/contrastive_loss": 4.332770347595215, + "train/negative_loss": 4.33276891708374, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 1.466275875827705e-06, + "train/total_loss": 1.0284991264343262 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.2790624499320984, - "train/contrastive_loss": 3.622471809387207, - "train/negative_loss": 1.7420179843902588, + "train/classification_loss": 0.17135140299797058, + "train/contrastive_loss": 1.140178918838501, + "train/negative_loss": 0.3936411142349243, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.8804539442062378, - "train/total_loss": 1.0035568475723267 + "train/positive_loss": 0.7465378642082214, + "train/total_loss": 0.3993871808052063 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.17414724826812744, - "train/contrastive_loss": 0.6907026171684265, - "train/negative_loss": 0.6876643896102905, + "train/classification_loss": 0.19975849986076355, + "train/contrastive_loss": 2.2232303619384766, + "train/negative_loss": 1.2000625133514404, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.0030382282566279173, - "train/total_loss": 0.3122877776622772 + "train/num_positives": 8, + "train/positive_loss": 1.0231679677963257, + "train/total_loss": 0.6444045901298523 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.17232745885849, - "train/contrastive_loss": 1.8300108909606934, - "train/negative_loss": 1.507612943649292, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.32239797711372375, - "train/total_loss": 0.5383296012878418 + "train/classification_loss": 0.1608150750398636, + "train/contrastive_loss": 2.643754482269287, + "train/negative_loss": 0.8494847416877747, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.7942698001861572, + "train/total_loss": 0.6895659565925598 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.1231592670083046, - "train/contrastive_loss": 1.1113731861114502, - "train/negative_loss": 0.3543608486652374, - "train/num_negatives": 46, + "train/classification_loss": 0.24466247856616974, + "train/contrastive_loss": 1.6202069520950317, + "train/negative_loss": 0.9127046465873718, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.7570123672485352, - "train/total_loss": 0.34543392062187195 + "train/positive_loss": 0.7075023055076599, + "train/total_loss": 0.5687038898468018 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.20448505878448486, - "train/contrastive_loss": 1.7337985038757324, - "train/negative_loss": 1.7337985038757324, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5512447357177734 - }, - { - "epoch": 10.64638783269962, - "eval_exact_match_accuracy": 0.31047619047619046, - "eval_hamming_loss": 0.06745098039215686, - "eval_loss": 0.5937800407409668, - "eval_macro_f1": 0.34223224265415836, - "eval_macro_precision": 0.5671291073267033, - "eval_macro_recall": 0.26885810139432437, - "eval_micro_f1": 0.5599415204678363, - "eval_micro_precision": 0.7832310838445807, - "eval_micro_recall": 0.43572241183162685, - "eval_runtime": 2.6321, - "eval_samples_per_second": 199.459, - "eval_steps_per_second": 25.075, + "train/classification_loss": 0.16331139206886292, + "train/contrastive_loss": 0.4944665729999542, + "train/negative_loss": 0.41176989674568176, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.08269666880369186, + "train/total_loss": 0.26220470666885376 + }, + { + "epoch": 9.859154929577464, + "eval_exact_match_accuracy": 0.2892416225749559, + "eval_hamming_loss": 0.06795310716879345, + "eval_loss": 0.5553329586982727, + "eval_macro_f1": 0.3898906591099431, + "eval_macro_precision": 0.6353736023298848, + "eval_macro_recall": 0.3207501530327882, + "eval_micro_f1": 0.5416375087473758, + "eval_micro_precision": 0.7881873727087576, + "eval_micro_recall": 0.4125799573560768, + "eval_runtime": 2.8425, + "eval_samples_per_second": 199.47, + "eval_steps_per_second": 24.978, "step": 2800 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.12091280519962311, - "train/contrastive_loss": 0.3634587824344635, - "train/negative_loss": 0.3564610183238983, - "train/num_negatives": 22, - "train/num_positives": 26, - "train/positive_loss": 0.006997766438871622, - "train/total_loss": 0.19360455870628357 + "train/classification_loss": 0.19349829852581024, + "train/contrastive_loss": 1.3443948030471802, + "train/negative_loss": 0.7074541449546814, + "train/num_negatives": 40, + "train/num_positives": 8, + "train/positive_loss": 0.6369406580924988, + "train/total_loss": 0.46237725019454956 }, { - "epoch": 10.64638783269962, + "epoch": 9.859154929577464, "step": 2800, - "train/classification_loss": 0.1648751050233841, - "train/contrastive_loss": 0.37624457478523254, - "train/negative_loss": 0.376228004693985, - "train/num_negatives": 36, - "train/num_positives": 20, - "train/positive_loss": 1.657027860346716e-05, - "train/total_loss": 0.24012401700019836 + "train/classification_loss": 0.14223407208919525, + "train/contrastive_loss": 0.6640971899032593, + "train/negative_loss": 0.6640753746032715, + "train/num_negatives": 52, + "train/num_positives": 2, + "train/positive_loss": 2.1815538275404833e-05, + "train/total_loss": 0.2750535011291504 }, { - "epoch": 10.836501901140684, - "grad_norm": 7.758701801300049, - "learning_rate": 1.9581887366818874e-05, - "loss": 0.5981, + "epoch": 10.035211267605634, + "grad_norm": 7.347024440765381, + "learning_rate": 1.961296687808316e-05, + "loss": 0.6289, "step": 2850 }, { - "epoch": 10.836501901140684, + "epoch": 10.035211267605634, "step": 2850, - "train/classification_loss": 0.14277829229831696, - "train/contrastive_loss": 0.6613541841506958, - "train/negative_loss": 0.5814878344535828, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.07986634224653244, - "train/total_loss": 0.2750491499900818 + "train/classification_loss": 0.16506929695606232, + "train/contrastive_loss": 0.8735600113868713, + "train/negative_loss": 0.27111417055130005, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.6024458408355713, + "train/total_loss": 0.3397812843322754 }, { - "epoch": 10.836501901140684, + "epoch": 10.035211267605634, "step": 2850, - "train/classification_loss": 0.11084019392728806, - "train/contrastive_loss": 0.5428822636604309, - "train/negative_loss": 0.5382305383682251, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 0.004651741124689579, - "train/total_loss": 0.21941664814949036 + "train/classification_loss": 0.16181811690330505, + "train/contrastive_loss": 0.7897449731826782, + "train/negative_loss": 0.5512301325798035, + "train/num_negatives": 24, + "train/num_positives": 24, + "train/positive_loss": 0.23851487040519714, + "train/total_loss": 0.3197671175003052 }, { - "epoch": 11.02661596958175, - "grad_norm": 5.387200832366943, - "learning_rate": 1.9574277016742772e-05, - "loss": 0.5915, + "epoch": 10.211267605633802, + "grad_norm": 6.384469985961914, + "learning_rate": 1.9605919661733618e-05, + "loss": 0.6112, "step": 2900 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.2585763931274414, - "train/contrastive_loss": 1.740926742553711, - "train/negative_loss": 0.7628422975540161, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.97808438539505, - "train/total_loss": 0.6067617535591125 + "train/classification_loss": 0.2628132700920105, + "train/contrastive_loss": 1.5475016832351685, + "train/negative_loss": 1.4081183671951294, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.13938328623771667, + "train/total_loss": 0.5723136067390442 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.19097460806369781, - "train/contrastive_loss": 1.8367418050765991, - "train/negative_loss": 1.367160439491272, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.46958136558532715, - "train/total_loss": 0.5583229660987854 + "train/classification_loss": 0.23209384083747864, + "train/contrastive_loss": 1.1163294315338135, + "train/negative_loss": 0.36060935258865356, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.7557200193405151, + "train/total_loss": 0.45535972714424133 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.14892542362213135, - "train/contrastive_loss": 0.9131455421447754, - "train/negative_loss": 0.4388388693332672, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.4743066728115082, - "train/total_loss": 0.3315545320510864 + "train/classification_loss": 0.21153056621551514, + "train/contrastive_loss": 3.230170249938965, + "train/negative_loss": 2.0683212280273438, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.161849021911621, + "train/total_loss": 0.8575646281242371 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.21070948243141174, - "train/contrastive_loss": 3.9781291484832764, - "train/negative_loss": 2.5855467319488525, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.3925824165344238, - "train/total_loss": 1.0063353776931763 + "train/classification_loss": 0.15908098220825195, + "train/contrastive_loss": 2.679654598236084, + "train/negative_loss": 1.5057131052017212, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 1.1739414930343628, + "train/total_loss": 0.6950119137763977 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.10843018442392349, - "train/contrastive_loss": 1.2648100852966309, - "train/negative_loss": 0.905613362789154, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.3591967523097992, - "train/total_loss": 0.36139219999313354 + "train/classification_loss": 0.17802831530570984, + "train/contrastive_loss": 2.07833194732666, + "train/negative_loss": 1.31305992603302, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.7652720212936401, + "train/total_loss": 0.5936946868896484 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.1718652993440628, - "train/contrastive_loss": 2.080847978591919, - "train/negative_loss": 1.3543455600738525, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.7265024781227112, - "train/total_loss": 0.5880349278450012 + "train/classification_loss": 0.20847803354263306, + "train/contrastive_loss": 2.733017683029175, + "train/negative_loss": 1.0552629232406616, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 1.6777547597885132, + "train/total_loss": 0.7550815939903259 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.20408809185028076, - "train/contrastive_loss": 1.380002737045288, - "train/negative_loss": 1.0364023447036743, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.34360039234161377, - "train/total_loss": 0.48008865118026733 + "train/classification_loss": 0.17177040874958038, + "train/contrastive_loss": 1.7280198335647583, + "train/negative_loss": 0.7447405457496643, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.983279287815094, + "train/total_loss": 0.5173743963241577 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.1612337976694107, - "train/contrastive_loss": 1.6814448833465576, - "train/negative_loss": 1.2421878576278687, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.4392569959163666, - "train/total_loss": 0.49752277135849 + "train/classification_loss": 0.17218448221683502, + "train/contrastive_loss": 0.8346590995788574, + "train/negative_loss": 0.834532618522644, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 0.0001264890597667545, + "train/total_loss": 0.33911630511283875 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.14306506514549255, - "train/contrastive_loss": 1.428497076034546, - "train/negative_loss": 1.4083350896835327, + "train/classification_loss": 0.1112944632768631, + "train/contrastive_loss": 1.037398338317871, + "train/negative_loss": 0.5850278735160828, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.020161928609013557, - "train/total_loss": 0.4287644922733307 + "train/positive_loss": 0.4523704946041107, + "train/total_loss": 0.31877413392066956 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.34162014722824097, - "train/contrastive_loss": 3.160057544708252, - "train/negative_loss": 1.740297794342041, + "train/classification_loss": 0.16975441575050354, + "train/contrastive_loss": 2.80088210105896, + "train/negative_loss": 1.5928813219070435, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.4197598695755005, - "train/total_loss": 0.9736316800117493 + "train/num_positives": 14, + "train/positive_loss": 1.2080007791519165, + "train/total_loss": 0.7299308776855469 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.19791936874389648, - "train/contrastive_loss": 2.956831932067871, - "train/negative_loss": 1.787305474281311, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 1.1695265769958496, - "train/total_loss": 0.7892857789993286 + "train/classification_loss": 0.13797059655189514, + "train/contrastive_loss": 2.165200710296631, + "train/negative_loss": 0.5847959518432617, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 1.5804046392440796, + "train/total_loss": 0.5710107088088989 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.1189102828502655, - "train/contrastive_loss": 1.6088440418243408, - "train/negative_loss": 0.6195995211601257, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.9892444610595703, - "train/total_loss": 0.4406791031360626 + "train/classification_loss": 0.15954400599002838, + "train/contrastive_loss": 1.3343087434768677, + "train/negative_loss": 1.3209974765777588, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.013311277143657207, + "train/total_loss": 0.42640578746795654 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.19293628633022308, - "train/contrastive_loss": 2.526085138320923, - "train/negative_loss": 2.007687568664551, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.5183975696563721, - "train/total_loss": 0.6981533169746399 + "train/classification_loss": 0.20986954867839813, + "train/contrastive_loss": 4.174795627593994, + "train/negative_loss": 1.9875352382659912, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 2.187260389328003, + "train/total_loss": 1.0448286533355713 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.10901818424463272, - "train/contrastive_loss": 1.1498570442199707, - "train/negative_loss": 1.1498072147369385, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 4.979323784937151e-05, - "train/total_loss": 0.33898958563804626 + "train/classification_loss": 0.16387797892093658, + "train/contrastive_loss": 1.3689451217651367, + "train/negative_loss": 0.9319843053817749, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.4369608461856842, + "train/total_loss": 0.43766701221466064 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.10920920222997665, - "train/contrastive_loss": 1.7683091163635254, - "train/negative_loss": 1.76611328125, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.002195884706452489, - "train/total_loss": 0.4628710448741913 + "train/classification_loss": 0.14226661622524261, + "train/contrastive_loss": 3.805375099182129, + "train/negative_loss": 0.9238763451576233, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 2.8814988136291504, + "train/total_loss": 0.9033416509628296 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.13088734447956085, - "train/contrastive_loss": 0.6560176014900208, - "train/negative_loss": 0.5218893885612488, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.13412819802761078, - "train/total_loss": 0.26209086179733276 + "train/classification_loss": 0.16320881247520447, + "train/contrastive_loss": 0.8691606521606445, + "train/negative_loss": 0.3121230900287628, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.5570375323295593, + "train/total_loss": 0.3370409607887268 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.24149109423160553, - "train/contrastive_loss": 2.383913516998291, - "train/negative_loss": 1.2237224578857422, - "train/num_negatives": 40, + "train/classification_loss": 0.1263202279806137, + "train/contrastive_loss": 1.771242380142212, + "train/negative_loss": 0.5729682445526123, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 1.1601911783218384, - "train/total_loss": 0.7182738184928894 + "train/positive_loss": 1.1982741355895996, + "train/total_loss": 0.48056870698928833 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.15930433571338654, - "train/contrastive_loss": 1.370179295539856, - "train/negative_loss": 0.5785582065582275, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.7916210889816284, - "train/total_loss": 0.4333401918411255 + "train/classification_loss": 0.16373278200626373, + "train/contrastive_loss": 0.30273059010505676, + "train/negative_loss": 0.2941136956214905, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.008616908453404903, + "train/total_loss": 0.22427889704704285 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.16022764146327972, - "train/contrastive_loss": 1.2843356132507324, - "train/negative_loss": 1.2842377424240112, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 9.789787873160094e-05, - "train/total_loss": 0.41709476709365845 + "train/classification_loss": 0.14347781240940094, + "train/contrastive_loss": 1.2606143951416016, + "train/negative_loss": 0.46871668100357056, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.791897714138031, + "train/total_loss": 0.39560067653656006 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.15395183861255646, - "train/contrastive_loss": 2.5148231983184814, - "train/negative_loss": 2.402395009994507, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.11242815852165222, - "train/total_loss": 0.6569164991378784 + "train/classification_loss": 0.21395543217658997, + "train/contrastive_loss": 3.584773540496826, + "train/negative_loss": 1.303221344947815, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 2.2815520763397217, + "train/total_loss": 0.9309101104736328 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.21534916758537292, - "train/contrastive_loss": 1.237306833267212, - "train/negative_loss": 0.262007474899292, - "train/num_negatives": 44, + "train/classification_loss": 0.13279476761817932, + "train/contrastive_loss": 1.4508020877838135, + "train/negative_loss": 1.4372400045394897, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.9752992987632751, - "train/total_loss": 0.4628105163574219 + "train/positive_loss": 0.01356208510696888, + "train/total_loss": 0.422955185174942 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.2336091697216034, - "train/contrastive_loss": 2.2728304862976074, - "train/negative_loss": 1.1783658266067505, - "train/num_negatives": 44, + "train/classification_loss": 0.13371767103672028, + "train/contrastive_loss": 3.249382972717285, + "train/negative_loss": 2.452887773513794, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 1.0944647789001465, - "train/total_loss": 0.6881752610206604 + "train/positive_loss": 0.7964953184127808, + "train/total_loss": 0.7835942506790161 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.13501381874084473, - "train/contrastive_loss": 1.4717390537261963, - "train/negative_loss": 0.5643835067749023, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.907355546951294, - "train/total_loss": 0.42936164140701294 + "train/classification_loss": 0.15158793330192566, + "train/contrastive_loss": 1.7863094806671143, + "train/negative_loss": 1.6163197755813599, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.169989675283432, + "train/total_loss": 0.5088498592376709 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.1274745911359787, - "train/contrastive_loss": 0.5078569054603577, - "train/negative_loss": 0.18285803496837616, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.3249988555908203, - "train/total_loss": 0.22904597222805023 + "train/classification_loss": 0.2671091854572296, + "train/contrastive_loss": 2.83126163482666, + "train/negative_loss": 1.3494688272476196, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.48179292678833, + "train/total_loss": 0.8333615064620972 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.08682894706726074, - "train/contrastive_loss": 0.8233351707458496, - "train/negative_loss": 0.18787714838981628, + "train/classification_loss": 0.1736839860677719, + "train/contrastive_loss": 1.984739065170288, + "train/negative_loss": 0.40271276235580444, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.6354579925537109, - "train/total_loss": 0.25149598717689514 + "train/num_positives": 10, + "train/positive_loss": 1.5820263624191284, + "train/total_loss": 0.5706318020820618 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.24888063967227936, - "train/contrastive_loss": 1.2541038990020752, - "train/negative_loss": 0.1854996383190155, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.0686042308807373, - "train/total_loss": 0.49970144033432007 + "train/classification_loss": 0.20055411756038666, + "train/contrastive_loss": 2.465477466583252, + "train/negative_loss": 1.534045934677124, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.9314315319061279, + "train/total_loss": 0.6936495900154114 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.26805534958839417, - "train/contrastive_loss": 3.19677734375, - "train/negative_loss": 1.6616671085357666, + "train/classification_loss": 0.1925583779811859, + "train/contrastive_loss": 2.431614637374878, + "train/negative_loss": 2.1127984523773193, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.535110354423523, - "train/total_loss": 0.9074108600616455 + "train/num_positives": 4, + "train/positive_loss": 0.3188161551952362, + "train/total_loss": 0.6788812875747681 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.15668313205242157, - "train/contrastive_loss": 3.104414701461792, - "train/negative_loss": 2.506190299987793, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.5982244610786438, - "train/total_loss": 0.7775660753250122 + "train/classification_loss": 0.18313775956630707, + "train/contrastive_loss": 0.34710225462913513, + "train/negative_loss": 0.2658122479915619, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.08129000663757324, + "train/total_loss": 0.2525582015514374 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.19333301484584808, - "train/contrastive_loss": 1.5682584047317505, - "train/negative_loss": 0.8982338309288025, - "train/num_negatives": 40, + "train/classification_loss": 0.27189186215400696, + "train/contrastive_loss": 3.0423965454101562, + "train/negative_loss": 1.3593348264694214, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.670024573802948, - "train/total_loss": 0.5069847106933594 - }, - { - "epoch": 11.02661596958175, - "step": 2900, - "train/classification_loss": 0.2154930979013443, - "train/contrastive_loss": 1.477970838546753, - "train/negative_loss": 1.0649974346160889, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.4129733443260193, - "train/total_loss": 0.5110872983932495 - }, - { - "epoch": 11.02661596958175, - "step": 2900, - "train/classification_loss": 0.13846148550510406, - "train/contrastive_loss": 2.8543951511383057, - "train/negative_loss": 1.7028539180755615, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 1.1515412330627441, - "train/total_loss": 0.709340512752533 + "train/positive_loss": 1.6830615997314453, + "train/total_loss": 0.8803712129592896 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.22234424948692322, - "train/contrastive_loss": 2.5295867919921875, - "train/negative_loss": 1.629623532295227, + "train/classification_loss": 0.17986933887004852, + "train/contrastive_loss": 0.6659830212593079, + "train/negative_loss": 0.6557236909866333, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.8999632000923157, - "train/total_loss": 0.7282615900039673 - }, - { - "epoch": 11.02661596958175, - "step": 2900, - "train/classification_loss": 0.18698523938655853, - "train/contrastive_loss": 0.7199073433876038, - "train/negative_loss": 0.7184258699417114, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0014814974274486303, - "train/total_loss": 0.3309667110443115 + "train/num_positives": 10, + "train/positive_loss": 0.010259347967803478, + "train/total_loss": 0.31306594610214233 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.169067844748497, - "train/contrastive_loss": 0.9233545064926147, - "train/negative_loss": 0.8584201335906982, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.06493434309959412, - "train/total_loss": 0.3537387549877167 + "train/classification_loss": 0.18539486825466156, + "train/contrastive_loss": 1.5846210718154907, + "train/negative_loss": 1.367700457572937, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.21692058444023132, + "train/total_loss": 0.5023190975189209 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.20981365442276, - "train/contrastive_loss": 3.609513759613037, - "train/negative_loss": 2.6516473293304443, + "train/classification_loss": 0.14992345869541168, + "train/contrastive_loss": 2.1614699363708496, + "train/negative_loss": 1.3060417175292969, "train/num_negatives": 52, "train/num_positives": 4, - "train/positive_loss": 0.9578664898872375, - "train/total_loss": 0.9317164421081543 + "train/positive_loss": 0.8554282188415527, + "train/total_loss": 0.5822174549102783 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.17624883353710175, - "train/contrastive_loss": 3.19402813911438, - "train/negative_loss": 1.5648763179779053, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.6291518211364746, - "train/total_loss": 0.8150544762611389 + "train/classification_loss": 0.18701496720314026, + "train/contrastive_loss": 2.342538595199585, + "train/negative_loss": 1.2122130393981934, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.1303255558013916, + "train/total_loss": 0.6555227041244507 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.15087518095970154, - "train/contrastive_loss": 1.352403163909912, - "train/negative_loss": 1.021414875984192, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.33098822832107544, - "train/total_loss": 0.42135581374168396 + "train/classification_loss": 0.22230593860149384, + "train/contrastive_loss": 2.030838966369629, + "train/negative_loss": 1.4303054809570312, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.6005334854125977, + "train/total_loss": 0.6284737586975098 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.1728045493364334, - "train/contrastive_loss": 1.014013648033142, - "train/negative_loss": 0.9988958835601807, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.015117738395929337, - "train/total_loss": 0.37560728192329407 + "train/classification_loss": 0.20898309350013733, + "train/contrastive_loss": 1.478989839553833, + "train/negative_loss": 0.8801543712615967, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.5988355278968811, + "train/total_loss": 0.5047810673713684 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.21599125862121582, - "train/contrastive_loss": 1.8973764181137085, - "train/negative_loss": 1.7870030403137207, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.11037334054708481, - "train/total_loss": 0.5954665541648865 + "train/classification_loss": 0.13425864279270172, + "train/contrastive_loss": 1.332768440246582, + "train/negative_loss": 1.3266702890396118, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.006098171230405569, + "train/total_loss": 0.4008123278617859 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.18479114770889282, - "train/contrastive_loss": 2.3830597400665283, - "train/negative_loss": 2.3785526752471924, + "train/classification_loss": 0.22147367894649506, + "train/contrastive_loss": 2.37888240814209, + "train/negative_loss": 0.39433708786964417, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.004507133737206459, - "train/total_loss": 0.6614030599594116 + "train/num_positives": 8, + "train/positive_loss": 1.984545350074768, + "train/total_loss": 0.6972501873970032 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.17315959930419922, - "train/contrastive_loss": 0.8763577938079834, - "train/negative_loss": 0.766486406326294, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.10987141728401184, - "train/total_loss": 0.34843116998672485 + "train/classification_loss": 0.24031203985214233, + "train/contrastive_loss": 3.3356821537017822, + "train/negative_loss": 3.214360475540161, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.12132158875465393, + "train/total_loss": 0.9074484705924988 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.1737559586763382, - "train/contrastive_loss": 2.532794952392578, - "train/negative_loss": 1.97202467918396, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.5607703924179077, - "train/total_loss": 0.6803149580955505 + "train/classification_loss": 0.2125992327928543, + "train/contrastive_loss": 1.0687923431396484, + "train/negative_loss": 0.4468400478363037, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.6219522356987, + "train/total_loss": 0.4263576865196228 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.20850807428359985, - "train/contrastive_loss": 1.5471532344818115, - "train/negative_loss": 0.571214497089386, + "train/classification_loss": 0.29739734530448914, + "train/contrastive_loss": 4.781063556671143, + "train/negative_loss": 2.208695888519287, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.9759386777877808, - "train/total_loss": 0.5179387331008911 + "train/num_positives": 8, + "train/positive_loss": 2.5723676681518555, + "train/total_loss": 1.2536100149154663 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.15292558073997498, - "train/contrastive_loss": 3.26169490814209, - "train/negative_loss": 1.487465262413025, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.7742295265197754, - "train/total_loss": 0.8052645921707153 + "train/classification_loss": 0.13947837054729462, + "train/contrastive_loss": 1.1287579536437988, + "train/negative_loss": 0.5803136229515076, + "train/num_negatives": 46, + "train/num_positives": 10, + "train/positive_loss": 0.5484442710876465, + "train/total_loss": 0.3652299642562866 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.14589259028434753, - "train/contrastive_loss": 1.0803455114364624, - "train/negative_loss": 0.5692500472068787, - "train/num_negatives": 40, + "train/classification_loss": 0.17628394067287445, + "train/contrastive_loss": 2.966888904571533, + "train/negative_loss": 1.6621443033218384, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.5110954642295837, - "train/total_loss": 0.36196169257164 + "train/positive_loss": 1.3047444820404053, + "train/total_loss": 0.7696617245674133 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.27761170268058777, - "train/contrastive_loss": 1.4024109840393066, - "train/negative_loss": 0.937574565410614, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.4648364782333374, - "train/total_loss": 0.5580939054489136 + "train/classification_loss": 0.14822180569171906, + "train/contrastive_loss": 0.5378744006156921, + "train/negative_loss": 0.5378078818321228, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 6.652127194683999e-05, + "train/total_loss": 0.2557966709136963 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.1080985888838768, - "train/contrastive_loss": 1.0187591314315796, - "train/negative_loss": 1.0187575817108154, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.549722128402209e-06, - "train/total_loss": 0.3118504285812378 + "train/classification_loss": 0.28061428666114807, + "train/contrastive_loss": 2.16581392288208, + "train/negative_loss": 1.159152865409851, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 1.0066609382629395, + "train/total_loss": 0.7137770652770996 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.11279600113630295, - "train/contrastive_loss": 0.42314082384109497, - "train/negative_loss": 0.20568686723709106, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.2174539715051651, - "train/total_loss": 0.19742417335510254 + "train/classification_loss": 0.15342897176742554, + "train/contrastive_loss": 0.7659542560577393, + "train/negative_loss": 0.7608383893966675, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.005115843378007412, + "train/total_loss": 0.3066198229789734 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.08670825511217117, - "train/contrastive_loss": 0.8059331178665161, - "train/negative_loss": 0.8044592142105103, + "train/classification_loss": 0.32758885622024536, + "train/contrastive_loss": 1.8111205101013184, + "train/negative_loss": 0.9260818362236023, "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.0014739001635462046, - "train/total_loss": 0.24789488315582275 + "train/num_positives": 18, + "train/positive_loss": 0.8850387334823608, + "train/total_loss": 0.689812958240509 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.17622320353984833, - "train/contrastive_loss": 1.575151801109314, - "train/negative_loss": 1.3429945707321167, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.23215720057487488, - "train/total_loss": 0.4912535548210144 + "train/classification_loss": 0.13064444065093994, + "train/contrastive_loss": 2.8732028007507324, + "train/negative_loss": 0.8690221905708313, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 2.004180669784546, + "train/total_loss": 0.7052850127220154 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.13294516503810883, - "train/contrastive_loss": 1.4039270877838135, - "train/negative_loss": 0.7784045934677124, + "train/classification_loss": 0.16293343901634216, + "train/contrastive_loss": 2.437732219696045, + "train/negative_loss": 2.081183433532715, "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.6255224347114563, - "train/total_loss": 0.41373056173324585 + "train/positive_loss": 0.35654887557029724, + "train/total_loss": 0.6504799127578735 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.14768970012664795, - "train/contrastive_loss": 0.34889325499534607, - "train/negative_loss": 0.34836727380752563, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.0005259931785985827, - "train/total_loss": 0.21746835112571716 + "train/classification_loss": 0.2592998445034027, + "train/contrastive_loss": 2.084942102432251, + "train/negative_loss": 2.08493971824646, + "train/num_negatives": 48, + "train/num_positives": 2, + "train/positive_loss": 2.2649790025752736e-06, + "train/total_loss": 0.6762882471084595 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.19090229272842407, - "train/contrastive_loss": 2.0051064491271973, - "train/negative_loss": 0.9063347578048706, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.098771572113037, - "train/total_loss": 0.5919235944747925 + "train/classification_loss": 0.2063748985528946, + "train/contrastive_loss": 2.7614307403564453, + "train/negative_loss": 1.3759068250656128, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 1.3855239152908325, + "train/total_loss": 0.7586610317230225 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.24010302126407623, - "train/contrastive_loss": 3.3736112117767334, - "train/negative_loss": 2.383720874786377, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.9898903965950012, - "train/total_loss": 0.9148252606391907 + "train/classification_loss": 0.12094295769929886, + "train/contrastive_loss": 0.18382498621940613, + "train/negative_loss": 0.15728388726711273, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.026541098952293396, + "train/total_loss": 0.15770795941352844 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.12910862267017365, - "train/contrastive_loss": 0.9344525337219238, - "train/negative_loss": 0.29654988646507263, + "train/classification_loss": 0.19040244817733765, + "train/contrastive_loss": 1.179012656211853, + "train/negative_loss": 0.9204587936401367, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.6379026174545288, - "train/total_loss": 0.3159991502761841 + "train/num_positives": 8, + "train/positive_loss": 0.2585538625717163, + "train/total_loss": 0.42620497941970825 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.1627723127603531, - "train/contrastive_loss": 2.9348855018615723, - "train/negative_loss": 1.5333905220031738, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.4014949798583984, - "train/total_loss": 0.7497494220733643 + "train/classification_loss": 0.18006786704063416, + "train/contrastive_loss": 1.1357351541519165, + "train/negative_loss": 0.9125902056694031, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.22314494848251343, + "train/total_loss": 0.407214879989624 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.26201459765434265, - "train/contrastive_loss": 3.4043643474578857, - "train/negative_loss": 1.4179768562316895, - "train/num_negatives": 46, + "train/classification_loss": 0.2964591383934021, + "train/contrastive_loss": 3.240980386734009, + "train/negative_loss": 1.3075833320617676, + "train/num_negatives": 36, "train/num_positives": 6, - "train/positive_loss": 1.9863874912261963, - "train/total_loss": 0.9428874254226685 + "train/positive_loss": 1.9333970546722412, + "train/total_loss": 0.9446552395820618 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.21741798520088196, - "train/contrastive_loss": 3.4402925968170166, - "train/negative_loss": 1.4437909126281738, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.9965016841888428, - "train/total_loss": 0.9054765701293945 + "train/classification_loss": 0.15920165181159973, + "train/contrastive_loss": 0.689811110496521, + "train/negative_loss": 0.49601730704307556, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.19379381835460663, + "train/total_loss": 0.29716387391090393 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.19118881225585938, - "train/contrastive_loss": 2.8007559776306152, - "train/negative_loss": 1.9305254220962524, + "train/classification_loss": 0.13423670828342438, + "train/contrastive_loss": 1.5894420146942139, + "train/negative_loss": 0.7994976043701172, "train/num_negatives": 34, "train/num_positives": 22, - "train/positive_loss": 0.8702306151390076, - "train/total_loss": 0.7513400316238403 + "train/positive_loss": 0.7899444699287415, + "train/total_loss": 0.4521251320838928 + }, + { + "epoch": 10.211267605633802, + "step": 2900, + "train/classification_loss": 0.14847001433372498, + "train/contrastive_loss": 1.1185154914855957, + "train/negative_loss": 0.5615684390068054, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.5569469928741455, + "train/total_loss": 0.37217313051223755 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.2418469339609146, - "train/contrastive_loss": 4.18387508392334, - "train/negative_loss": 2.1317081451416016, + "train/classification_loss": 0.19374050199985504, + "train/contrastive_loss": 4.017642021179199, + "train/negative_loss": 2.2876029014587402, "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.730039119720459, + "train/total_loss": 0.9972689151763916 + }, + { + "epoch": 10.211267605633802, + "step": 2900, + "train/classification_loss": 0.19868767261505127, + "train/contrastive_loss": 1.0947338342666626, + "train/negative_loss": 0.5714030265808105, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.523330807685852, + "train/total_loss": 0.41763442754745483 + }, + { + "epoch": 10.211267605633802, + "step": 2900, + "train/classification_loss": 0.08811814337968826, + "train/contrastive_loss": 0.2297048419713974, + "train/negative_loss": 0.2284664362668991, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.0012384126894176006, + "train/total_loss": 0.1340591162443161 + }, + { + "epoch": 10.211267605633802, + "step": 2900, + "train/classification_loss": 0.19191573560237885, + "train/contrastive_loss": 2.388416290283203, + "train/negative_loss": 1.7922662496566772, + "train/num_negatives": 40, "train/num_positives": 10, - "train/positive_loss": 2.0521669387817383, - "train/total_loss": 1.0786219835281372 + "train/positive_loss": 0.5961501002311707, + "train/total_loss": 0.6695989966392517 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.21268275380134583, - "train/contrastive_loss": 3.620016574859619, - "train/negative_loss": 2.7963509559631348, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.8236655592918396, - "train/total_loss": 0.9366860389709473 + "train/classification_loss": 0.20889155566692352, + "train/contrastive_loss": 1.2571130990982056, + "train/negative_loss": 1.2430636882781982, + "train/num_negatives": 46, + "train/num_positives": 2, + "train/positive_loss": 0.014049414545297623, + "train/total_loss": 0.46031415462493896 + }, + { + "epoch": 10.211267605633802, + "step": 2900, + "train/classification_loss": 0.1371251493692398, + "train/contrastive_loss": 1.5753488540649414, + "train/negative_loss": 0.7840390801429749, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.7913098335266113, + "train/total_loss": 0.4521949291229248 + }, + { + "epoch": 10.211267605633802, + "step": 2900, + "train/classification_loss": 0.23302072286605835, + "train/contrastive_loss": 2.856095314025879, + "train/negative_loss": 1.8790549039840698, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.9770404696464539, + "train/total_loss": 0.804239809513092 + }, + { + "epoch": 10.211267605633802, + "step": 2900, + "train/classification_loss": 0.16038738191127777, + "train/contrastive_loss": 2.011524200439453, + "train/negative_loss": 0.7170014977455139, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 1.294522762298584, + "train/total_loss": 0.5626922249794006 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.28219375014305115, - "train/contrastive_loss": 3.8104820251464844, - "train/negative_loss": 2.135993719100952, + "train/classification_loss": 0.1599067747592926, + "train/contrastive_loss": 5.245911121368408, + "train/negative_loss": 5.245909690856934, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 1.5854857338126749e-06, + "train/total_loss": 1.2090890407562256 + }, + { + "epoch": 10.211267605633802, + "step": 2900, + "train/classification_loss": 0.16568949818611145, + "train/contrastive_loss": 0.7083851099014282, + "train/negative_loss": 0.4586718678474426, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.6744883060455322, - "train/total_loss": 1.0442901849746704 + "train/positive_loss": 0.2497132271528244, + "train/total_loss": 0.3073665201663971 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.17107729613780975, - "train/contrastive_loss": 0.7542315125465393, - "train/negative_loss": 0.6879888772964478, + "train/classification_loss": 0.21125702559947968, + "train/contrastive_loss": 2.7015156745910645, + "train/negative_loss": 1.6683448553085327, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.06624261289834976, - "train/total_loss": 0.3219236135482788 + "train/num_positives": 8, + "train/positive_loss": 1.0331707000732422, + "train/total_loss": 0.7515602111816406 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.17708244919776917, - "train/contrastive_loss": 1.7290434837341309, - "train/negative_loss": 1.5278027057647705, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.20124076306819916, - "train/total_loss": 0.5228911638259888 + "train/classification_loss": 0.16208994388580322, + "train/contrastive_loss": 2.0591349601745605, + "train/negative_loss": 0.8783535957336426, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.1807812452316284, + "train/total_loss": 0.5739169120788574 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.11657316982746124, - "train/contrastive_loss": 0.8646166324615479, - "train/negative_loss": 0.3449186384677887, - "train/num_negatives": 46, + "train/classification_loss": 0.26127591729164124, + "train/contrastive_loss": 1.510298252105713, + "train/negative_loss": 1.1916983127593994, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.5196980237960815, - "train/total_loss": 0.2894964814186096 + "train/positive_loss": 0.31859999895095825, + "train/total_loss": 0.5633355379104614 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.20022404193878174, - "train/contrastive_loss": 1.728529453277588, - "train/negative_loss": 1.728529453277588, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5459299087524414 - }, - { - "epoch": 11.02661596958175, - "eval_exact_match_accuracy": 0.31238095238095237, - "eval_hamming_loss": 0.06554621848739496, - "eval_loss": 0.5652662515640259, - "eval_macro_f1": 0.35633481687177776, - "eval_macro_precision": 0.5754560174818795, - "eval_macro_recall": 0.2821388056574931, - "eval_micro_f1": 0.5763939174511223, - "eval_micro_precision": 0.7928286852589641, - "eval_micro_recall": 0.4527872582480091, - "eval_runtime": 2.6257, - "eval_samples_per_second": 199.944, - "eval_steps_per_second": 25.136, + "train/classification_loss": 0.16329923272132874, + "train/contrastive_loss": 1.3590660095214844, + "train/negative_loss": 0.9801003336906433, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.37896573543548584, + "train/total_loss": 0.43511244654655457 + }, + { + "epoch": 10.211267605633802, + "eval_exact_match_accuracy": 0.32275132275132273, + "eval_hamming_loss": 0.06463326071169208, + "eval_loss": 0.5829338431358337, + "eval_macro_f1": 0.4351002757555069, + "eval_macro_precision": 0.6404843330845489, + "eval_macro_recall": 0.3521258198223301, + "eval_micro_f1": 0.5787694388100068, + "eval_micro_precision": 0.7911275415896488, + "eval_micro_recall": 0.4562899786780384, + "eval_runtime": 2.8488, + "eval_samples_per_second": 199.031, + "eval_steps_per_second": 24.923, "step": 2900 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.12048979103565216, - "train/contrastive_loss": 0.4127001166343689, - "train/negative_loss": 0.4125082194805145, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.0001919057685881853, - "train/total_loss": 0.2030298113822937 + "train/classification_loss": 0.10593006759881973, + "train/contrastive_loss": 0.6669097542762756, + "train/negative_loss": 0.6588942408561707, + "train/num_negatives": 36, + "train/num_positives": 20, + "train/positive_loss": 0.008015519939363003, + "train/total_loss": 0.23931202292442322 }, { - "epoch": 11.02661596958175, + "epoch": 10.211267605633802, "step": 2900, - "train/classification_loss": 0.1277117133140564, - "train/contrastive_loss": 0.9486163854598999, - "train/negative_loss": 0.9009051322937012, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.04771128296852112, - "train/total_loss": 0.31743499636650085 + "train/classification_loss": 0.14086495339870453, + "train/contrastive_loss": 1.5772793292999268, + "train/negative_loss": 1.271799087524414, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 0.3054801821708679, + "train/total_loss": 0.4563208222389221 }, { - "epoch": 11.216730038022813, - "grad_norm": 7.097142219543457, - "learning_rate": 1.956666666666667e-05, - "loss": 0.5958, + "epoch": 10.387323943661972, + "grad_norm": 14.002019882202148, + "learning_rate": 1.9598872445384076e-05, + "loss": 0.6253, "step": 2950 }, { - "epoch": 11.216730038022813, + "epoch": 10.387323943661972, "step": 2950, - "train/classification_loss": 0.09659489244222641, - "train/contrastive_loss": 0.32379037141799927, - "train/negative_loss": 0.32296091318130493, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.0008294543367810547, - "train/total_loss": 0.1613529622554779 + "train/classification_loss": 0.07413940131664276, + "train/contrastive_loss": 0.1552697718143463, + "train/negative_loss": 0.13997884094715118, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.015290931798517704, + "train/total_loss": 0.1051933541893959 }, { - "epoch": 11.216730038022813, + "epoch": 10.387323943661972, "step": 2950, - "train/classification_loss": 0.12459646910429001, - "train/contrastive_loss": 0.9049633741378784, - "train/negative_loss": 0.6516837477684021, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.2532796561717987, - "train/total_loss": 0.30558913946151733 + "train/classification_loss": 0.1367824524641037, + "train/contrastive_loss": 0.5186465978622437, + "train/negative_loss": 0.5146605968475342, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.00398603081703186, + "train/total_loss": 0.24051177501678467 }, { - "epoch": 11.406844106463879, - "grad_norm": 8.175446510314941, - "learning_rate": 1.9559056316590565e-05, - "loss": 0.5599, + "epoch": 10.56338028169014, + "grad_norm": 11.690299987792969, + "learning_rate": 1.9591825229034534e-05, + "loss": 0.6032, "step": 3000 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.2460077553987503, - "train/contrastive_loss": 1.7875924110412598, - "train/negative_loss": 1.0787734985351562, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.7088188529014587, - "train/total_loss": 0.60352623462677 + "train/classification_loss": 0.2762620747089386, + "train/contrastive_loss": 2.3873162269592285, + "train/negative_loss": 1.5687317848205566, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.8185845613479614, + "train/total_loss": 0.7537252902984619 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.16835083067417145, - "train/contrastive_loss": 1.5462809801101685, - "train/negative_loss": 1.1407911777496338, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.40548980236053467, - "train/total_loss": 0.47760701179504395 + "train/classification_loss": 0.25543755292892456, + "train/contrastive_loss": 1.2461047172546387, + "train/negative_loss": 0.472343385219574, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.7737613916397095, + "train/total_loss": 0.5046585202217102 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.16128778457641602, - "train/contrastive_loss": 1.2429862022399902, - "train/negative_loss": 0.28416210412979126, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.9588241577148438, - "train/total_loss": 0.409885048866272 + "train/classification_loss": 0.23958174884319305, + "train/contrastive_loss": 2.76216459274292, + "train/negative_loss": 1.3364864587783813, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.425678014755249, + "train/total_loss": 0.7920147180557251 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.22657646238803864, - "train/contrastive_loss": 3.7108354568481445, - "train/negative_loss": 2.5892937183380127, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.1215416193008423, - "train/total_loss": 0.9687435626983643 + "train/classification_loss": 0.16245520114898682, + "train/contrastive_loss": 2.3808512687683105, + "train/negative_loss": 1.7466623783111572, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.6341889500617981, + "train/total_loss": 0.6386255025863647 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.10366299003362656, - "train/contrastive_loss": 1.2759945392608643, - "train/negative_loss": 1.080255150794983, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.19573932886123657, - "train/total_loss": 0.35886192321777344 + "train/classification_loss": 0.2083040475845337, + "train/contrastive_loss": 2.8997902870178223, + "train/negative_loss": 2.8517308235168457, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.04805942624807358, + "train/total_loss": 0.788262128829956 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.17348365485668182, - "train/contrastive_loss": 1.8329436779022217, - "train/negative_loss": 1.212402582168579, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.6205410957336426, - "train/total_loss": 0.5400723814964294 + "train/classification_loss": 0.20814986526966095, + "train/contrastive_loss": 2.683485507965088, + "train/negative_loss": 1.347381591796875, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 1.3361037969589233, + "train/total_loss": 0.7448469400405884 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.21991436183452606, - "train/contrastive_loss": 2.166783571243286, - "train/negative_loss": 1.3268084526062012, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.8399750590324402, - "train/total_loss": 0.6532710790634155 + "train/classification_loss": 0.19245050847530365, + "train/contrastive_loss": 2.4646382331848145, + "train/negative_loss": 1.1738001108169556, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.2908380031585693, + "train/total_loss": 0.6853781342506409 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.15702003240585327, - "train/contrastive_loss": 1.737476110458374, - "train/negative_loss": 1.2656153440475464, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.4718608260154724, - "train/total_loss": 0.5045152902603149 + "train/classification_loss": 0.19908642768859863, + "train/contrastive_loss": 1.0945513248443604, + "train/negative_loss": 1.0945110321044922, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 4.0293551137438044e-05, + "train/total_loss": 0.41799670457839966 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.12862704694271088, - "train/contrastive_loss": 0.9805291295051575, - "train/negative_loss": 0.9593443870544434, + "train/classification_loss": 0.10663730651140213, + "train/contrastive_loss": 0.43518689274787903, + "train/negative_loss": 0.4090810716152191, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.021184762939810753, - "train/total_loss": 0.32473286986351013 + "train/positive_loss": 0.02610582672059536, + "train/total_loss": 0.19367468357086182 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.33259037137031555, - "train/contrastive_loss": 3.059068202972412, - "train/negative_loss": 1.5818933248519897, + "train/classification_loss": 0.1675368696451187, + "train/contrastive_loss": 1.748020887374878, + "train/negative_loss": 0.7628961801528931, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.4771747589111328, - "train/total_loss": 0.9444040060043335 + "train/num_positives": 14, + "train/positive_loss": 0.9851246476173401, + "train/total_loss": 0.5171410441398621 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.18981976807117462, - "train/contrastive_loss": 3.0175364017486572, - "train/negative_loss": 1.7657978534698486, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 1.2517385482788086, - "train/total_loss": 0.7933270335197449 + "train/classification_loss": 0.1484692394733429, + "train/contrastive_loss": 1.2832281589508057, + "train/negative_loss": 0.8856143951416016, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.3976137340068817, + "train/total_loss": 0.40511488914489746 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.11571092903614044, - "train/contrastive_loss": 1.3443200588226318, - "train/negative_loss": 0.5773237347602844, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.7669963836669922, - "train/total_loss": 0.3845749497413635 + "train/classification_loss": 0.15774308145046234, + "train/contrastive_loss": 1.4628280401229858, + "train/negative_loss": 1.3172005414962769, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.14562752842903137, + "train/total_loss": 0.4503086805343628 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.1516052633523941, - "train/contrastive_loss": 2.145120143890381, - "train/negative_loss": 2.1333134174346924, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.011806661263108253, - "train/total_loss": 0.580629289150238 + "train/classification_loss": 0.20536047220230103, + "train/contrastive_loss": 3.2447919845581055, + "train/negative_loss": 1.9048564434051514, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.339935541152954, + "train/total_loss": 0.8543188571929932 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.12423818558454514, - "train/contrastive_loss": 2.328566551208496, - "train/negative_loss": 2.328213930130005, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.00035253219539299607, - "train/total_loss": 0.5899515151977539 + "train/classification_loss": 0.1619938760995865, + "train/contrastive_loss": 1.0439677238464355, + "train/negative_loss": 0.6946704983711243, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.34929725527763367, + "train/total_loss": 0.37078744173049927 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.09402937442064285, - "train/contrastive_loss": 0.8607133626937866, - "train/negative_loss": 0.8522325754165649, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.008480768650770187, - "train/total_loss": 0.26617205142974854 + "train/classification_loss": 0.14412476122379303, + "train/contrastive_loss": 3.019122838973999, + "train/negative_loss": 0.9273945689201355, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 2.0917282104492188, + "train/total_loss": 0.7479493021965027 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.12282104790210724, - "train/contrastive_loss": 0.43985193967819214, - "train/negative_loss": 0.2673581838607788, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.17249377071857452, - "train/total_loss": 0.2107914388179779 + "train/classification_loss": 0.1468760371208191, + "train/contrastive_loss": 0.5179504752159119, + "train/negative_loss": 0.37436434626579285, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.14358612895011902, + "train/total_loss": 0.25046613812446594 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.2313510924577713, - "train/contrastive_loss": 2.0404858589172363, - "train/negative_loss": 1.2266383171081543, - "train/num_negatives": 40, + "train/classification_loss": 0.11221809685230255, + "train/contrastive_loss": 0.8565540313720703, + "train/negative_loss": 0.5195607542991638, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.8138476610183716, - "train/total_loss": 0.6394482851028442 + "train/positive_loss": 0.3369932770729065, + "train/total_loss": 0.2835289239883423 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.16369837522506714, - "train/contrastive_loss": 1.371705412864685, - "train/negative_loss": 0.4722364544868469, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.8994689583778381, - "train/total_loss": 0.4380394518375397 + "train/classification_loss": 0.1688118875026703, + "train/contrastive_loss": 0.9327883720397949, + "train/negative_loss": 0.3360637128353119, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.5967246294021606, + "train/total_loss": 0.35536956787109375 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.18732303380966187, - "train/contrastive_loss": 2.1580970287323, - "train/negative_loss": 2.154425859451294, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.003671215381473303, - "train/total_loss": 0.6189424395561218 + "train/classification_loss": 0.15971487760543823, + "train/contrastive_loss": 2.3112308979034424, + "train/negative_loss": 0.8913699984550476, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 1.4198609590530396, + "train/total_loss": 0.6219610571861267 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.14963382482528687, - "train/contrastive_loss": 2.013792037963867, - "train/negative_loss": 1.361496925354004, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.6522949934005737, - "train/total_loss": 0.5523922443389893 + "train/classification_loss": 0.21708834171295166, + "train/contrastive_loss": 3.3200504779815674, + "train/negative_loss": 1.1901757717132568, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 2.1298747062683105, + "train/total_loss": 0.8810984492301941 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.20522984862327576, - "train/contrastive_loss": 1.5552414655685425, - "train/negative_loss": 0.36278292536735535, - "train/num_negatives": 44, + "train/classification_loss": 0.1149444729089737, + "train/contrastive_loss": 1.7186161279678345, + "train/negative_loss": 1.7137479782104492, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.1924585103988647, - "train/total_loss": 0.5162781476974487 + "train/positive_loss": 0.004868112504482269, + "train/total_loss": 0.45866769552230835 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.23116886615753174, - "train/contrastive_loss": 1.6908693313598633, - "train/negative_loss": 1.1880009174346924, - "train/num_negatives": 44, + "train/classification_loss": 0.13831518590450287, + "train/contrastive_loss": 3.3318591117858887, + "train/negative_loss": 2.577338218688965, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.5028684735298157, - "train/total_loss": 0.5693427324295044 + "train/positive_loss": 0.7545210123062134, + "train/total_loss": 0.8046870231628418 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.1303163319826126, - "train/contrastive_loss": 1.3386789560317993, - "train/negative_loss": 0.538434624671936, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.8002443313598633, - "train/total_loss": 0.3980521559715271 + "train/classification_loss": 0.14285585284233093, + "train/contrastive_loss": 1.9449069499969482, + "train/negative_loss": 0.8926212787628174, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 1.0522856712341309, + "train/total_loss": 0.5318372249603271 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.12415100634098053, - "train/contrastive_loss": 0.37868618965148926, - "train/negative_loss": 0.1813802421092987, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.19730594754219055, - "train/total_loss": 0.19988824427127838 + "train/classification_loss": 0.23551133275032043, + "train/contrastive_loss": 2.9736928939819336, + "train/negative_loss": 1.9470629692077637, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.02662992477417, + "train/total_loss": 0.8302499055862427 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.08950117230415344, - "train/contrastive_loss": 1.1763198375701904, - "train/negative_loss": 0.6714333891868591, + "train/classification_loss": 0.1685134321451187, + "train/contrastive_loss": 2.478376865386963, + "train/negative_loss": 1.3601411581039429, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.5048865079879761, - "train/total_loss": 0.324765145778656 + "train/num_positives": 10, + "train/positive_loss": 1.11823570728302, + "train/total_loss": 0.664188802242279 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.2535746097564697, - "train/contrastive_loss": 1.4467504024505615, - "train/negative_loss": 0.10707000643014908, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.3396804332733154, - "train/total_loss": 0.542924702167511 + "train/classification_loss": 0.2670794427394867, + "train/contrastive_loss": 3.8331222534179688, + "train/negative_loss": 2.744384765625, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.0887373685836792, + "train/total_loss": 1.0337039232254028 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.2579728364944458, - "train/contrastive_loss": 3.5354440212249756, - "train/negative_loss": 1.3759825229644775, + "train/classification_loss": 0.1832488775253296, + "train/contrastive_loss": 2.2549726963043213, + "train/negative_loss": 2.2538952827453613, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 2.159461498260498, - "train/total_loss": 0.9650616645812988 + "train/num_positives": 4, + "train/positive_loss": 0.001077397377230227, + "train/total_loss": 0.6342434287071228 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.1573730707168579, - "train/contrastive_loss": 2.817941427230835, - "train/negative_loss": 2.300238847732544, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.5177025198936462, - "train/total_loss": 0.7209613919258118 + "train/classification_loss": 0.2047833800315857, + "train/contrastive_loss": 1.1822214126586914, + "train/negative_loss": 1.1603710651397705, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.021850330755114555, + "train/total_loss": 0.44122767448425293 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.17016902565956116, - "train/contrastive_loss": 1.3016204833984375, - "train/negative_loss": 0.8056268095970154, - "train/num_negatives": 40, + "train/classification_loss": 0.2744237780570984, + "train/contrastive_loss": 3.28920841217041, + "train/negative_loss": 1.2559646368026733, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.49599361419677734, - "train/total_loss": 0.4304931163787842 + "train/positive_loss": 2.0332438945770264, + "train/total_loss": 0.9322654604911804 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.2269555926322937, - "train/contrastive_loss": 1.9593873023986816, - "train/negative_loss": 1.5597097873687744, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.39967745542526245, - "train/total_loss": 0.618833065032959 + "train/classification_loss": 0.18878227472305298, + "train/contrastive_loss": 0.6206185817718506, + "train/negative_loss": 0.6101956367492676, + "train/num_negatives": 38, + "train/num_positives": 10, + "train/positive_loss": 0.01042292919009924, + "train/total_loss": 0.3129059970378876 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.13402676582336426, - "train/contrastive_loss": 2.7644128799438477, - "train/negative_loss": 1.5623483657836914, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 1.2020645141601562, - "train/total_loss": 0.6869093775749207 + "train/classification_loss": 0.18836022913455963, + "train/contrastive_loss": 1.750382423400879, + "train/negative_loss": 1.3351140022277832, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.4152684807777405, + "train/total_loss": 0.5384367108345032 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.22593103349208832, - "train/contrastive_loss": 2.2663116455078125, - "train/negative_loss": 1.1768672466278076, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.0894443988800049, - "train/total_loss": 0.679193377494812 + "train/classification_loss": 0.1622367799282074, + "train/contrastive_loss": 3.5931925773620605, + "train/negative_loss": 2.5476036071777344, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.0455890893936157, + "train/total_loss": 0.8808753490447998 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.24519100785255432, - "train/contrastive_loss": 1.1132460832595825, - "train/negative_loss": 1.1125224828720093, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0007235640659928322, - "train/total_loss": 0.4678402245044708 + "train/classification_loss": 0.1841551810503006, + "train/contrastive_loss": 1.511103868484497, + "train/negative_loss": 0.9502866864204407, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.5608171820640564, + "train/total_loss": 0.48637598752975464 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.17888036370277405, - "train/contrastive_loss": 0.8936871290206909, - "train/negative_loss": 0.5934308171272278, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.3002563416957855, - "train/total_loss": 0.3576177954673767 + "train/classification_loss": 0.26156654953956604, + "train/contrastive_loss": 2.263023853302002, + "train/negative_loss": 1.9572700262069702, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.3057537078857422, + "train/total_loss": 0.714171290397644 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.20060838758945465, - "train/contrastive_loss": 3.2346978187561035, - "train/negative_loss": 2.6373584270477295, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.5973393321037292, - "train/total_loss": 0.8475479483604431 + "train/classification_loss": 0.2191566675901413, + "train/contrastive_loss": 1.6404569149017334, + "train/negative_loss": 0.8151454925537109, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.8253113627433777, + "train/total_loss": 0.5472480654716492 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.17035207152366638, - "train/contrastive_loss": 2.6656641960144043, - "train/negative_loss": 1.4173641204833984, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.2483001947402954, - "train/total_loss": 0.7034848928451538 + "train/classification_loss": 0.16641321778297424, + "train/contrastive_loss": 3.6082730293273926, + "train/negative_loss": 3.6082630157470703, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 9.928638974088244e-06, + "train/total_loss": 0.8880678415298462 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.12790991365909576, - "train/contrastive_loss": 1.187825083732605, - "train/negative_loss": 1.0027514696121216, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.1850736290216446, - "train/total_loss": 0.3654749393463135 + "train/classification_loss": 0.21078330278396606, + "train/contrastive_loss": 2.788423538208008, + "train/negative_loss": 0.8298013806343079, + "train/num_negatives": 46, + "train/num_positives": 8, + "train/positive_loss": 1.9586220979690552, + "train/total_loss": 0.7684680223464966 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.18845951557159424, - "train/contrastive_loss": 1.1508179903030396, - "train/negative_loss": 1.0606627464294434, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.0901552215218544, - "train/total_loss": 0.4186231195926666 + "train/classification_loss": 0.22494281828403473, + "train/contrastive_loss": 3.441727638244629, + "train/negative_loss": 2.8914742469787598, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.5502535104751587, + "train/total_loss": 0.9132883548736572 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.20356474816799164, - "train/contrastive_loss": 1.9221891164779663, - "train/negative_loss": 1.7523301839828491, - "train/num_negatives": 46, + "train/classification_loss": 0.2436332106590271, + "train/contrastive_loss": 0.7654647827148438, + "train/negative_loss": 0.2511307895183563, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.5143340229988098, + "train/total_loss": 0.39672619104385376 + }, + { + "epoch": 10.56338028169014, + "step": 3000, + "train/classification_loss": 0.29328644275665283, + "train/contrastive_loss": 4.5129265785217285, + "train/negative_loss": 1.815167784690857, + "train/num_negatives": 42, "train/num_positives": 8, - "train/positive_loss": 0.16985894739627838, - "train/total_loss": 0.5880025625228882 + "train/positive_loss": 2.697758674621582, + "train/total_loss": 1.1958718299865723 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.1865595430135727, - "train/contrastive_loss": 2.1952462196350098, - "train/negative_loss": 2.1607000827789307, + "train/classification_loss": 0.18113462626934052, + "train/contrastive_loss": 2.5789456367492676, + "train/negative_loss": 1.396188497543335, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.0345461331307888, - "train/total_loss": 0.6256088018417358 + "train/num_positives": 10, + "train/positive_loss": 1.182757019996643, + "train/total_loss": 0.6969237923622131 + }, + { + "epoch": 10.56338028169014, + "step": 3000, + "train/classification_loss": 0.1820196807384491, + "train/contrastive_loss": 1.809961199760437, + "train/negative_loss": 1.4282125234603882, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.38174864649772644, + "train/total_loss": 0.5440119504928589 + }, + { + "epoch": 10.56338028169014, + "step": 3000, + "train/classification_loss": 0.17479562759399414, + "train/contrastive_loss": 0.9607092142105103, + "train/negative_loss": 0.9605926275253296, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.00011656926653813571, + "train/total_loss": 0.36693745851516724 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.16585251688957214, - "train/contrastive_loss": 1.6458406448364258, - "train/negative_loss": 1.0878812074661255, + "train/classification_loss": 0.2636986970901489, + "train/contrastive_loss": 2.545609951019287, + "train/negative_loss": 1.4108635187149048, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.5579594969749451, - "train/total_loss": 0.49502065777778625 + "train/positive_loss": 1.1347464323043823, + "train/total_loss": 0.7728207111358643 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.17591886222362518, - "train/contrastive_loss": 2.5057668685913086, - "train/negative_loss": 1.8299767971038818, - "train/num_negatives": 36, + "train/classification_loss": 0.17134632170200348, + "train/contrastive_loss": 1.4071953296661377, + "train/negative_loss": 0.769248902797699, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.6379464864730835, + "train/total_loss": 0.4527853727340698 + }, + { + "epoch": 10.56338028169014, + "step": 3000, + "train/classification_loss": 0.3339294493198395, + "train/contrastive_loss": 2.163451671600342, + "train/negative_loss": 0.8712236881256104, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 0.6757900714874268, - "train/total_loss": 0.677072286605835 + "train/positive_loss": 1.292227864265442, + "train/total_loss": 0.7666198015213013 + }, + { + "epoch": 10.56338028169014, + "step": 3000, + "train/classification_loss": 0.13371475040912628, + "train/contrastive_loss": 2.418879985809326, + "train/negative_loss": 0.6593396067619324, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.759540319442749, + "train/total_loss": 0.6174907684326172 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.19505055248737335, - "train/contrastive_loss": 1.0013597011566162, - "train/negative_loss": 0.3520565629005432, + "train/classification_loss": 0.18897037208080292, + "train/contrastive_loss": 3.7722811698913574, + "train/negative_loss": 3.054877281188965, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.649303138256073, - "train/total_loss": 0.3953225016593933 + "train/num_positives": 14, + "train/positive_loss": 0.7174040079116821, + "train/total_loss": 0.9434266090393066 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.14135748147964478, - "train/contrastive_loss": 1.755215048789978, - "train/negative_loss": 0.7532435655593872, + "train/classification_loss": 0.2586095929145813, + "train/contrastive_loss": 2.0080924034118652, + "train/negative_loss": 2.008091449737549, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.0019714832305908, - "train/total_loss": 0.49240049719810486 + "train/num_positives": 2, + "train/positive_loss": 9.536747711536009e-07, + "train/total_loss": 0.6602280735969543 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.1272624284029007, - "train/contrastive_loss": 1.2888516187667847, - "train/negative_loss": 0.7470607757568359, + "train/classification_loss": 0.19155491888523102, + "train/contrastive_loss": 2.808267831802368, + "train/negative_loss": 1.588202953338623, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.5417908430099487, - "train/total_loss": 0.3850327730178833 + "train/num_positives": 16, + "train/positive_loss": 1.2200648784637451, + "train/total_loss": 0.7532084584236145 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.2813057601451874, - "train/contrastive_loss": 2.190946340560913, - "train/negative_loss": 1.0955936908721924, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 1.0953526496887207, - "train/total_loss": 0.7194950580596924 + "train/classification_loss": 0.11223132163286209, + "train/contrastive_loss": 0.18879052996635437, + "train/negative_loss": 0.1261802464723587, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.06261028349399567, + "train/total_loss": 0.14998942613601685 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.10840906947851181, - "train/contrastive_loss": 0.8657689094543457, - "train/negative_loss": 0.8657673597335815, - "train/num_negatives": 48, + "train/classification_loss": 0.18023742735385895, + "train/contrastive_loss": 0.8828045129776001, + "train/negative_loss": 0.8595558404922485, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 1.549722128402209e-06, - "train/total_loss": 0.281562864780426 + "train/positive_loss": 0.023248683661222458, + "train/total_loss": 0.35679835081100464 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.11977273225784302, - "train/contrastive_loss": 0.825147271156311, - "train/negative_loss": 0.4187302887439728, + "train/classification_loss": 0.19564281404018402, + "train/contrastive_loss": 1.6861006021499634, + "train/negative_loss": 1.5358744859695435, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.40641701221466064, - "train/total_loss": 0.2848021984100342 + "train/num_positives": 14, + "train/positive_loss": 0.1502261459827423, + "train/total_loss": 0.5328629612922668 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.10419487953186035, - "train/contrastive_loss": 1.1158815622329712, - "train/negative_loss": 0.9900193810462952, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.1258622258901596, - "train/total_loss": 0.32737118005752563 + "train/classification_loss": 0.30229437351226807, + "train/contrastive_loss": 2.5030159950256348, + "train/negative_loss": 1.3248379230499268, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 1.178178071975708, + "train/total_loss": 0.802897572517395 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.18383416533470154, - "train/contrastive_loss": 2.506121873855591, - "train/negative_loss": 2.3886687755584717, - "train/num_negatives": 28, + "train/classification_loss": 0.14517316222190857, + "train/contrastive_loss": 1.179174542427063, + "train/negative_loss": 1.0594836473464966, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.11745303869247437, - "train/total_loss": 0.68505859375 + "train/positive_loss": 0.11969085782766342, + "train/total_loss": 0.3810080885887146 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.14499320089817047, - "train/contrastive_loss": 1.7671196460723877, - "train/negative_loss": 0.5339397192001343, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.2331799268722534, - "train/total_loss": 0.4984171390533447 + "train/classification_loss": 0.13750970363616943, + "train/contrastive_loss": 0.7566724419593811, + "train/negative_loss": 0.3975960314273834, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.3590764105319977, + "train/total_loss": 0.28884419798851013 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.15418565273284912, - "train/contrastive_loss": 0.8312177658081055, - "train/negative_loss": 0.3118648827075958, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.5193528532981873, - "train/total_loss": 0.3204292058944702 + "train/classification_loss": 0.16646422445774078, + "train/contrastive_loss": 2.040703773498535, + "train/negative_loss": 1.0129212141036987, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.0277825593948364, + "train/total_loss": 0.5746049880981445 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.16117538511753082, - "train/contrastive_loss": 1.2060853242874146, - "train/negative_loss": 0.6577202677726746, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.54836505651474, - "train/total_loss": 0.4023924469947815 + "train/classification_loss": 0.20582664012908936, + "train/contrastive_loss": 4.210188388824463, + "train/negative_loss": 1.2171884775161743, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 2.993000030517578, + "train/total_loss": 1.047864317893982 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.23695331811904907, - "train/contrastive_loss": 3.3306233882904053, - "train/negative_loss": 2.585937976837158, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.7446854710578918, - "train/total_loss": 0.903078019618988 + "train/classification_loss": 0.19206711649894714, + "train/contrastive_loss": 1.3858373165130615, + "train/negative_loss": 0.7494128346443176, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.6364244818687439, + "train/total_loss": 0.4692345857620239 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.15182018280029297, - "train/contrastive_loss": 1.1750937700271606, - "train/negative_loss": 0.4060361087322235, + "train/classification_loss": 0.10709568113088608, + "train/contrastive_loss": 0.725210964679718, + "train/negative_loss": 0.7208110690116882, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.7690576910972595, - "train/total_loss": 0.3868389427661896 + "train/num_positives": 16, + "train/positive_loss": 0.004399867728352547, + "train/total_loss": 0.2521378695964813 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.1742718368768692, - "train/contrastive_loss": 2.8512275218963623, - "train/negative_loss": 1.819934606552124, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.0312929153442383, - "train/total_loss": 0.7445173263549805 + "train/classification_loss": 0.1921747773885727, + "train/contrastive_loss": 2.197178840637207, + "train/negative_loss": 1.372187614440918, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 0.8249912261962891, + "train/total_loss": 0.6316105723381042 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.26590824127197266, - "train/contrastive_loss": 3.6876583099365234, - "train/negative_loss": 1.4186726808547974, + "train/classification_loss": 0.23746086657047272, + "train/contrastive_loss": 1.5042730569839478, + "train/negative_loss": 1.3201839923858643, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 2.2689857482910156, - "train/total_loss": 1.0034399032592773 + "train/num_positives": 2, + "train/positive_loss": 0.18408910930156708, + "train/total_loss": 0.53831547498703 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.20893029868602753, - "train/contrastive_loss": 2.9733974933624268, - "train/negative_loss": 1.536466360092163, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.4369311332702637, - "train/total_loss": 0.8036098480224609 + "train/classification_loss": 0.15973779559135437, + "train/contrastive_loss": 2.2139954566955566, + "train/negative_loss": 1.3080657720565796, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.9059298038482666, + "train/total_loss": 0.6025369167327881 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.18405790627002716, - "train/contrastive_loss": 2.6884098052978516, - "train/negative_loss": 2.1735570430755615, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.5148528218269348, - "train/total_loss": 0.7217398881912231 + "train/classification_loss": 0.18993617594242096, + "train/contrastive_loss": 1.3275916576385498, + "train/negative_loss": 0.9583486914634705, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.36924299597740173, + "train/total_loss": 0.4554545283317566 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.24799588322639465, - "train/contrastive_loss": 4.17476749420166, - "train/negative_loss": 1.8092999458312988, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 2.3654677867889404, - "train/total_loss": 1.0829493999481201 + "train/classification_loss": 0.17862918972969055, + "train/contrastive_loss": 2.797597885131836, + "train/negative_loss": 0.7121429443359375, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 2.0854549407958984, + "train/total_loss": 0.7381488084793091 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.2283252328634262, - "train/contrastive_loss": 4.305217742919922, - "train/negative_loss": 3.3206844329833984, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.9845334887504578, - "train/total_loss": 1.0893688201904297 + "train/classification_loss": 0.14451172947883606, + "train/contrastive_loss": 3.5993711948394775, + "train/negative_loss": 3.5993692874908447, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 1.835825969465077e-06, + "train/total_loss": 0.8643859624862671 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.2991081178188324, - "train/contrastive_loss": 3.4270687103271484, - "train/negative_loss": 1.6912280321121216, + "train/classification_loss": 0.15485413372516632, + "train/contrastive_loss": 0.5619473457336426, + "train/negative_loss": 0.354228138923645, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.7358406782150269, - "train/total_loss": 0.9845218658447266 + "train/positive_loss": 0.20771919190883636, + "train/total_loss": 0.2672435939311981 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.16825774312019348, - "train/contrastive_loss": 0.8527832627296448, - "train/negative_loss": 0.7120317816734314, + "train/classification_loss": 0.20139886438846588, + "train/contrastive_loss": 2.9238600730895996, + "train/negative_loss": 1.357291579246521, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.14075146615505219, - "train/total_loss": 0.338814377784729 + "train/num_positives": 8, + "train/positive_loss": 1.566568374633789, + "train/total_loss": 0.7861708998680115 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.16019345819950104, - "train/contrastive_loss": 1.8533010482788086, - "train/negative_loss": 1.1728296279907227, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.6804713606834412, - "train/total_loss": 0.5308536887168884 + "train/classification_loss": 0.1958179622888565, + "train/contrastive_loss": 2.95369553565979, + "train/negative_loss": 1.2270042896270752, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.7266912460327148, + "train/total_loss": 0.7865570783615112 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.11453720927238464, - "train/contrastive_loss": 0.9892170429229736, - "train/negative_loss": 0.304633766412735, - "train/num_negatives": 46, + "train/classification_loss": 0.25784116983413696, + "train/contrastive_loss": 2.2676851749420166, + "train/negative_loss": 1.1066980361938477, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.684583306312561, - "train/total_loss": 0.3123806118965149 + "train/positive_loss": 1.160987138748169, + "train/total_loss": 0.7113782167434692 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.20270280539989471, - "train/contrastive_loss": 1.857444405555725, - "train/negative_loss": 1.857444405555725, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.574191689491272 - }, - { - "epoch": 11.406844106463879, - "eval_exact_match_accuracy": 0.3180952380952381, - "eval_hamming_loss": 0.06532212885154062, - "eval_loss": 0.5655184984207153, - "eval_macro_f1": 0.3593068317626967, - "eval_macro_precision": 0.5906339711138869, - "eval_macro_recall": 0.29020490228113227, - "eval_micro_f1": 0.5832737669764118, - "eval_micro_precision": 0.7846153846153846, - "eval_micro_recall": 0.4641638225255973, - "eval_runtime": 2.6268, - "eval_samples_per_second": 199.859, - "eval_steps_per_second": 25.125, + "train/classification_loss": 0.16992880403995514, + "train/contrastive_loss": 0.767574667930603, + "train/negative_loss": 0.7672322988510132, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.0003423854650463909, + "train/total_loss": 0.323443740606308 + }, + { + "epoch": 10.56338028169014, + "eval_exact_match_accuracy": 0.30687830687830686, + "eval_hamming_loss": 0.06867932358128437, + "eval_loss": 0.6113051176071167, + "eval_macro_f1": 0.39493366640337385, + "eval_macro_precision": 0.6247004748047559, + "eval_macro_recall": 0.31731720981631967, + "eval_micro_f1": 0.5520974289580515, + "eval_micro_precision": 0.7555555555555555, + "eval_micro_recall": 0.4349680170575693, + "eval_runtime": 2.8624, + "eval_samples_per_second": 198.085, + "eval_steps_per_second": 24.804, "step": 3000 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.12474408000707626, - "train/contrastive_loss": 0.4539308547973633, - "train/negative_loss": 0.45362919569015503, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.0003016649279743433, - "train/total_loss": 0.21553024649620056 + "train/classification_loss": 0.13586701452732086, + "train/contrastive_loss": 0.9734164476394653, + "train/negative_loss": 0.7267447710037231, + "train/num_negatives": 30, + "train/num_positives": 18, + "train/positive_loss": 0.2466716766357422, + "train/total_loss": 0.33055031299591064 }, { - "epoch": 11.406844106463879, + "epoch": 10.56338028169014, "step": 3000, - "train/classification_loss": 0.13093146681785583, - "train/contrastive_loss": 0.6874858736991882, - "train/negative_loss": 0.29949474334716797, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.38799113035202026, - "train/total_loss": 0.26842862367630005 + "train/classification_loss": 0.22636692225933075, + "train/contrastive_loss": 1.1001310348510742, + "train/negative_loss": 0.4253845810890198, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.6747464537620544, + "train/total_loss": 0.44639313220977783 }, { - "epoch": 11.596958174904943, - "grad_norm": 5.855732440948486, - "learning_rate": 1.9551445966514463e-05, - "loss": 0.553, + "epoch": 10.73943661971831, + "grad_norm": 8.174198150634766, + "learning_rate": 1.958477801268499e-05, + "loss": 0.6474, "step": 3050 }, { - "epoch": 11.596958174904943, + "epoch": 10.73943661971831, "step": 3050, - "train/classification_loss": 0.11329378932714462, - "train/contrastive_loss": 0.26736801862716675, - "train/negative_loss": 0.26733070611953735, - "train/num_negatives": 40, - "train/num_positives": 6, - "train/positive_loss": 3.731324977707118e-05, - "train/total_loss": 0.16676738858222961 + "train/classification_loss": 0.09077351540327072, + "train/contrastive_loss": 1.7142343521118164, + "train/negative_loss": 1.6784005165100098, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.03583380579948425, + "train/total_loss": 0.4336203932762146 }, { - "epoch": 11.596958174904943, + "epoch": 10.73943661971831, "step": 3050, - "train/classification_loss": 0.09523150324821472, - "train/contrastive_loss": 0.2954108417034149, - "train/negative_loss": 0.29532548785209656, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 8.534462540410459e-05, - "train/total_loss": 0.15431366860866547 + "train/classification_loss": 0.17790691554546356, + "train/contrastive_loss": 0.7195115089416504, + "train/negative_loss": 0.2735605835914612, + "train/num_negatives": 30, + "train/num_positives": 18, + "train/positive_loss": 0.4459509253501892, + "train/total_loss": 0.32180923223495483 }, { - "epoch": 11.787072243346007, - "grad_norm": 14.080097198486328, - "learning_rate": 1.9543835616438358e-05, - "loss": 0.5457, + "epoch": 10.915492957746478, + "grad_norm": 22.022693634033203, + "learning_rate": 1.957773079633545e-05, + "loss": 0.5927, "step": 3100 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.30850985646247864, - "train/contrastive_loss": 2.438037157058716, - "train/negative_loss": 1.8319498300552368, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.6060873866081238, - "train/total_loss": 0.7961173057556152 + "train/classification_loss": 0.2864118814468384, + "train/contrastive_loss": 1.887838363647461, + "train/negative_loss": 1.645249605178833, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.24258872866630554, + "train/total_loss": 0.6639795303344727 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.17118917405605316, - "train/contrastive_loss": 1.8063771724700928, - "train/negative_loss": 1.326668381690979, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.47970882058143616, - "train/total_loss": 0.5324646234512329 + "train/classification_loss": 0.24336405098438263, + "train/contrastive_loss": 1.0732638835906982, + "train/negative_loss": 0.5296627283096313, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.5436012148857117, + "train/total_loss": 0.4580168128013611 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.1661079227924347, - "train/contrastive_loss": 1.290942907333374, - "train/negative_loss": 0.4647131860256195, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.8262297511100769, - "train/total_loss": 0.424296498298645 + "train/classification_loss": 0.24337171018123627, + "train/contrastive_loss": 3.356455087661743, + "train/negative_loss": 1.7600804567337036, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.5963746309280396, + "train/total_loss": 0.914662778377533 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.23913997411727905, - "train/contrastive_loss": 2.6735897064208984, - "train/negative_loss": 1.486357569694519, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.1872321367263794, - "train/total_loss": 0.7738579511642456 + "train/classification_loss": 0.18461358547210693, + "train/contrastive_loss": 3.4242005348205566, + "train/negative_loss": 2.0972795486450195, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 1.3269211053848267, + "train/total_loss": 0.8694537281990051 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.11367961764335632, - "train/contrastive_loss": 1.6446164846420288, - "train/negative_loss": 1.217618703842163, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.4269977807998657, - "train/total_loss": 0.4426029324531555 + "train/classification_loss": 0.1745333969593048, + "train/contrastive_loss": 2.0744104385375977, + "train/negative_loss": 1.5164457559585571, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.5579646229743958, + "train/total_loss": 0.5894154906272888 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.1782500147819519, - "train/contrastive_loss": 1.765442132949829, - "train/negative_loss": 1.1532024145126343, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.6122397184371948, - "train/total_loss": 0.5313384532928467 + "train/classification_loss": 0.2251957356929779, + "train/contrastive_loss": 2.4608092308044434, + "train/negative_loss": 1.6046676635742188, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.8561415076255798, + "train/total_loss": 0.7173575758934021 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.24368718266487122, - "train/contrastive_loss": 2.4556100368499756, - "train/negative_loss": 1.1317987442016602, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 1.3238112926483154, - "train/total_loss": 0.734809160232544 + "train/classification_loss": 0.18051719665527344, + "train/contrastive_loss": 1.5304803848266602, + "train/negative_loss": 0.7692257761955261, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.761254608631134, + "train/total_loss": 0.48661327362060547 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.1527947187423706, - "train/contrastive_loss": 1.4951581954956055, - "train/negative_loss": 0.930124819278717, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.5650333762168884, - "train/total_loss": 0.4518263638019562 + "train/classification_loss": 0.16268013417720795, + "train/contrastive_loss": 0.45500245690345764, + "train/negative_loss": 0.4549833834171295, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 1.9073668227065355e-05, + "train/total_loss": 0.25368061661720276 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.1275285929441452, - "train/contrastive_loss": 0.7532818913459778, - "train/negative_loss": 0.7374222874641418, + "train/classification_loss": 0.1237364113330841, + "train/contrastive_loss": 2.254930257797241, + "train/negative_loss": 0.9909666776657104, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.015859588980674744, - "train/total_loss": 0.2781849801540375 + "train/positive_loss": 1.2639635801315308, + "train/total_loss": 0.5747224688529968 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.34821832180023193, - "train/contrastive_loss": 2.8812687397003174, - "train/negative_loss": 1.5116010904312134, + "train/classification_loss": 0.16575469076633453, + "train/contrastive_loss": 1.8757065534591675, + "train/negative_loss": 1.4117900133132935, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.369667649269104, - "train/total_loss": 0.9244720935821533 + "train/num_positives": 14, + "train/positive_loss": 0.463916540145874, + "train/total_loss": 0.5408959984779358 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.19269056618213654, - "train/contrastive_loss": 2.7230725288391113, - "train/negative_loss": 1.6545416116714478, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 1.0685310363769531, - "train/total_loss": 0.7373050451278687 + "train/classification_loss": 0.13043059408664703, + "train/contrastive_loss": 1.236993432044983, + "train/negative_loss": 0.379549115896225, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.8574442863464355, + "train/total_loss": 0.37782928347587585 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.11435721069574356, - "train/contrastive_loss": 1.3678646087646484, - "train/negative_loss": 0.3516920208930969, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 1.0161726474761963, - "train/total_loss": 0.38793012499809265 + "train/classification_loss": 0.17029546201229095, + "train/contrastive_loss": 2.510523796081543, + "train/negative_loss": 1.636656403541565, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.8738675117492676, + "train/total_loss": 0.6724002361297607 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.16035668551921844, - "train/contrastive_loss": 2.078024387359619, - "train/negative_loss": 1.8627076148986816, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.21531686186790466, - "train/total_loss": 0.5759615898132324 + "train/classification_loss": 0.21521975100040436, + "train/contrastive_loss": 3.4830446243286133, + "train/negative_loss": 1.8847639560699463, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.598280668258667, + "train/total_loss": 0.9118286967277527 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.12188967317342758, - "train/contrastive_loss": 2.0551159381866455, - "train/negative_loss": 2.05480694770813, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.0003088944358751178, - "train/total_loss": 0.5329128503799438 + "train/classification_loss": 0.15509048104286194, + "train/contrastive_loss": 1.3517342805862427, + "train/negative_loss": 0.742401659488678, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.6093326210975647, + "train/total_loss": 0.425437331199646 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.10308941453695297, - "train/contrastive_loss": 1.3137239217758179, - "train/negative_loss": 0.7169795036315918, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.5967444181442261, - "train/total_loss": 0.36583420634269714 + "train/classification_loss": 0.12977679073810577, + "train/contrastive_loss": 2.0522046089172363, + "train/negative_loss": 0.5493854880332947, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.5028190612792969, + "train/total_loss": 0.5402176976203918 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.11910144239664078, - "train/contrastive_loss": 0.7604823112487793, - "train/negative_loss": 0.45046234130859375, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.31001994013786316, - "train/total_loss": 0.2711979150772095 + "train/classification_loss": 0.16477005183696747, + "train/contrastive_loss": 1.2424614429473877, + "train/negative_loss": 0.30191347002983093, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.9405479431152344, + "train/total_loss": 0.41326233744621277 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.23285993933677673, - "train/contrastive_loss": 2.1962900161743164, - "train/negative_loss": 1.0654946565628052, - "train/num_negatives": 40, + "train/classification_loss": 0.1339196115732193, + "train/contrastive_loss": 1.1581369638442993, + "train/negative_loss": 0.12770843505859375, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 1.1307953596115112, - "train/total_loss": 0.6721179485321045 + "train/positive_loss": 1.0304285287857056, + "train/total_loss": 0.3655470013618469 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.1814068853855133, - "train/contrastive_loss": 1.9178614616394043, - "train/negative_loss": 0.9271084070205688, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.9907531142234802, - "train/total_loss": 0.5649791955947876 + "train/classification_loss": 0.19022709131240845, + "train/contrastive_loss": 1.423992395401001, + "train/negative_loss": 0.4855671226978302, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.9384252429008484, + "train/total_loss": 0.47502556443214417 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.18418172001838684, - "train/contrastive_loss": 1.5422708988189697, - "train/negative_loss": 1.5323821306228638, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.0098887262865901, - "train/total_loss": 0.49263590574264526 + "train/classification_loss": 0.1645231544971466, + "train/contrastive_loss": 1.8002641201019287, + "train/negative_loss": 0.862368106842041, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.9378959536552429, + "train/total_loss": 0.52457594871521 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.14255692064762115, - "train/contrastive_loss": 2.0502266883850098, - "train/negative_loss": 1.0674811601638794, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.9827456474304199, - "train/total_loss": 0.5526022911071777 + "train/classification_loss": 0.20813487470149994, + "train/contrastive_loss": 3.664506673812866, + "train/negative_loss": 1.383126974105835, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 2.2813796997070312, + "train/total_loss": 0.9410362243652344 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.1906108260154724, - "train/contrastive_loss": 1.4210673570632935, - "train/negative_loss": 0.3878963887691498, - "train/num_negatives": 44, + "train/classification_loss": 0.11586124449968338, + "train/contrastive_loss": 1.495785117149353, + "train/negative_loss": 1.4938901662826538, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.0331709384918213, - "train/total_loss": 0.47482430934906006 + "train/positive_loss": 0.00189495540689677, + "train/total_loss": 0.4150182604789734 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.23364029824733734, - "train/contrastive_loss": 1.964447259902954, - "train/negative_loss": 1.0934561491012573, - "train/num_negatives": 44, + "train/classification_loss": 0.11913207173347473, + "train/contrastive_loss": 2.461695909500122, + "train/negative_loss": 1.6116716861724854, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.8709911108016968, - "train/total_loss": 0.6265297532081604 + "train/positive_loss": 0.8500242233276367, + "train/total_loss": 0.6114712953567505 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.14438021183013916, - "train/contrastive_loss": 1.5457876920700073, - "train/negative_loss": 0.4354158639907837, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 1.1103718280792236, - "train/total_loss": 0.4535377621650696 + "train/classification_loss": 0.16245511174201965, + "train/contrastive_loss": 2.0862247943878174, + "train/negative_loss": 2.040592670440674, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.04563206061720848, + "train/total_loss": 0.5797001123428345 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.14111614227294922, - "train/contrastive_loss": 1.1998090744018555, - "train/negative_loss": 0.21785691380500793, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.9819521903991699, - "train/total_loss": 0.38107794523239136 + "train/classification_loss": 0.28559696674346924, + "train/contrastive_loss": 2.0909156799316406, + "train/negative_loss": 1.271106243133545, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.8198093175888062, + "train/total_loss": 0.7037801146507263 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.10276228189468384, - "train/contrastive_loss": 1.4988818168640137, - "train/negative_loss": 0.46438688039779663, + "train/classification_loss": 0.1815870702266693, + "train/contrastive_loss": 2.731168031692505, + "train/negative_loss": 0.738377034664154, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 1.0344949960708618, - "train/total_loss": 0.4025386571884155 + "train/num_positives": 10, + "train/positive_loss": 1.9927910566329956, + "train/total_loss": 0.727820634841919 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.2761395275592804, - "train/contrastive_loss": 1.7263723611831665, - "train/negative_loss": 0.34429416060447693, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.3820781707763672, - "train/total_loss": 0.6214140057563782 + "train/classification_loss": 0.19949638843536377, + "train/contrastive_loss": 2.3821473121643066, + "train/negative_loss": 1.4946497678756714, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.8874974846839905, + "train/total_loss": 0.6759258508682251 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.2570796310901642, - "train/contrastive_loss": 3.2612366676330566, - "train/negative_loss": 1.5015274286270142, + "train/classification_loss": 0.18911835551261902, + "train/contrastive_loss": 3.349832534790039, + "train/negative_loss": 1.8693777322769165, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.759709358215332, - "train/total_loss": 0.9093270301818848 + "train/num_positives": 4, + "train/positive_loss": 1.480454921722412, + "train/total_loss": 0.8590848445892334 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.1660730093717575, - "train/contrastive_loss": 3.4777040481567383, - "train/negative_loss": 2.6118478775024414, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.8658562898635864, - "train/total_loss": 0.8616138696670532 + "train/classification_loss": 0.17546650767326355, + "train/contrastive_loss": 0.23197080194950104, + "train/negative_loss": 0.16607673466205597, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.06589406728744507, + "train/total_loss": 0.22186067700386047 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.19621846079826355, - "train/contrastive_loss": 1.3405632972717285, - "train/negative_loss": 0.6862110495567322, - "train/num_negatives": 40, + "train/classification_loss": 0.2607475817203522, + "train/contrastive_loss": 2.7584080696105957, + "train/negative_loss": 1.547375202178955, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.6543523073196411, - "train/total_loss": 0.46433112025260925 - }, - { - "epoch": 11.787072243346007, - "step": 3100, - "train/classification_loss": 0.20874522626399994, - "train/contrastive_loss": 0.9922718405723572, - "train/negative_loss": 0.9497359395027161, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.042535919696092606, - "train/total_loss": 0.40719959139823914 - }, - { - "epoch": 11.787072243346007, - "step": 3100, - "train/classification_loss": 0.1417238712310791, - "train/contrastive_loss": 2.4431538581848145, - "train/negative_loss": 1.2108582258224487, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 1.2322955131530762, - "train/total_loss": 0.630354642868042 + "train/positive_loss": 1.211032748222351, + "train/total_loss": 0.8124291896820068 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.22046470642089844, - "train/contrastive_loss": 2.305354118347168, - "train/negative_loss": 1.326872706413269, + "train/classification_loss": 0.18682272732257843, + "train/contrastive_loss": 0.9725147485733032, + "train/negative_loss": 0.9686235189437866, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.9784815311431885, - "train/total_loss": 0.681535542011261 + "train/num_positives": 10, + "train/positive_loss": 0.0038912203162908554, + "train/total_loss": 0.3813256621360779 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.2712894082069397, - "train/contrastive_loss": 1.3946226835250854, - "train/negative_loss": 1.3942121267318726, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.00041058147326111794, - "train/total_loss": 0.5502139329910278 + "train/classification_loss": 0.15884801745414734, + "train/contrastive_loss": 1.14173424243927, + "train/negative_loss": 1.0859134197235107, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.05582084506750107, + "train/total_loss": 0.3871948719024658 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.19949695467948914, - "train/contrastive_loss": 0.84244704246521, - "train/negative_loss": 0.4347458779811859, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.40770119428634644, - "train/total_loss": 0.36798638105392456 + "train/classification_loss": 0.1540917456150055, + "train/contrastive_loss": 1.5852687358856201, + "train/negative_loss": 1.068734884262085, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.5165338516235352, + "train/total_loss": 0.47114551067352295 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.19579117000102997, - "train/contrastive_loss": 2.9402761459350586, - "train/negative_loss": 2.3121609687805176, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.6281151175498962, - "train/total_loss": 0.7838464379310608 + "train/classification_loss": 0.18662399053573608, + "train/contrastive_loss": 1.9513202905654907, + "train/negative_loss": 1.1811792850494385, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.7701410055160522, + "train/total_loss": 0.5768880844116211 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.17434538900852203, - "train/contrastive_loss": 2.8224329948425293, - "train/negative_loss": 1.4390313625335693, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.3834015130996704, - "train/total_loss": 0.7388319969177246 + "train/classification_loss": 0.21067319810390472, + "train/contrastive_loss": 2.445605754852295, + "train/negative_loss": 1.8993991613388062, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.5462064743041992, + "train/total_loss": 0.699794352054596 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.16889899969100952, - "train/contrastive_loss": 2.1365671157836914, - "train/negative_loss": 1.6418653726577759, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.49470168352127075, - "train/total_loss": 0.5962123870849609 + "train/classification_loss": 0.21469761431217194, + "train/contrastive_loss": 2.5030813217163086, + "train/negative_loss": 1.2699363231658936, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 1.2331451177597046, + "train/total_loss": 0.7153138518333435 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.1681680977344513, - "train/contrastive_loss": 0.7774358987808228, - "train/negative_loss": 0.7774287462234497, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 7.152582838898525e-06, - "train/total_loss": 0.32365527749061584 + "train/classification_loss": 0.13888822495937347, + "train/contrastive_loss": 1.0031150579452515, + "train/negative_loss": 0.9300569891929626, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.07305808365345001, + "train/total_loss": 0.3395112454891205 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.19506977498531342, - "train/contrastive_loss": 1.4856916666030884, - "train/negative_loss": 1.4739717245101929, + "train/classification_loss": 0.18932612240314484, + "train/contrastive_loss": 2.515317440032959, + "train/negative_loss": 0.7715743780136108, "train/num_negatives": 46, "train/num_positives": 8, - "train/positive_loss": 0.011719942092895508, - "train/total_loss": 0.4922081232070923 + "train/positive_loss": 1.7437431812286377, + "train/total_loss": 0.6923896074295044 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.18655599653720856, - "train/contrastive_loss": 2.1325838565826416, - "train/negative_loss": 2.120394468307495, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.012189408764243126, - "train/total_loss": 0.6130727529525757 + "train/classification_loss": 0.23474206030368805, + "train/contrastive_loss": 2.8058667182922363, + "train/negative_loss": 2.665243148803711, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.14062350988388062, + "train/total_loss": 0.795915424823761 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.15362490713596344, - "train/contrastive_loss": 0.7722576260566711, - "train/negative_loss": 0.7455851435661316, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.026672495529055595, - "train/total_loss": 0.3080764412879944 + "train/classification_loss": 0.2089659720659256, + "train/contrastive_loss": 1.217363715171814, + "train/negative_loss": 0.5548285841941833, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.6625351309776306, + "train/total_loss": 0.45243871212005615 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.18498140573501587, - "train/contrastive_loss": 2.203679084777832, - "train/negative_loss": 1.4016309976577759, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.8020479679107666, - "train/total_loss": 0.6257172226905823 + "train/classification_loss": 0.2850220501422882, + "train/contrastive_loss": 4.733141899108887, + "train/negative_loss": 2.235766887664795, + "train/num_negatives": 42, + "train/num_positives": 8, + "train/positive_loss": 2.497375011444092, + "train/total_loss": 1.231650471687317 + }, + { + "epoch": 10.915492957746478, + "step": 3100, + "train/classification_loss": 0.13214343786239624, + "train/contrastive_loss": 0.8666453957557678, + "train/negative_loss": 0.6629396677017212, + "train/num_negatives": 46, + "train/num_positives": 10, + "train/positive_loss": 0.20370574295520782, + "train/total_loss": 0.3054725229740143 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.206832155585289, - "train/contrastive_loss": 0.7932976484298706, - "train/negative_loss": 0.1437096893787384, + "train/classification_loss": 0.1611281782388687, + "train/contrastive_loss": 1.518791913986206, + "train/negative_loss": 1.1376475095748901, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.6495879292488098, - "train/total_loss": 0.36549168825149536 + "train/num_positives": 14, + "train/positive_loss": 0.3811444342136383, + "train/total_loss": 0.46488654613494873 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.13265672326087952, - "train/contrastive_loss": 1.7116001844406128, - "train/negative_loss": 0.7400783896446228, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.97152179479599, - "train/total_loss": 0.4749767780303955 + "train/classification_loss": 0.15202417969703674, + "train/contrastive_loss": 0.5903093218803406, + "train/negative_loss": 0.5901009440422058, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.00020837149349972606, + "train/total_loss": 0.27008605003356934 + }, + { + "epoch": 10.915492957746478, + "step": 3100, + "train/classification_loss": 0.238716259598732, + "train/contrastive_loss": 0.6789034605026245, + "train/negative_loss": 0.6504549980163574, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.02844846621155739, + "train/total_loss": 0.3744969367980957 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.13616080582141876, - "train/contrastive_loss": 0.7258492708206177, - "train/negative_loss": 0.3014896512031555, + "train/classification_loss": 0.15262065827846527, + "train/contrastive_loss": 0.8248007893562317, + "train/negative_loss": 0.7848192453384399, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.42435961961746216, - "train/total_loss": 0.2813306450843811 + "train/num_positives": 12, + "train/positive_loss": 0.03998157009482384, + "train/total_loss": 0.31758081912994385 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.25409799814224243, - "train/contrastive_loss": 1.2719230651855469, - "train/negative_loss": 0.6375426054000854, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.6343804597854614, - "train/total_loss": 0.5084825754165649 + "train/classification_loss": 0.33645617961883545, + "train/contrastive_loss": 2.646329402923584, + "train/negative_loss": 1.732357144355774, + "train/num_negatives": 30, + "train/num_positives": 18, + "train/positive_loss": 0.9139721393585205, + "train/total_loss": 0.8657220602035522 + }, + { + "epoch": 10.915492957746478, + "step": 3100, + "train/classification_loss": 0.13383379578590393, + "train/contrastive_loss": 2.0540456771850586, + "train/negative_loss": 1.0507713556289673, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.0032742023468018, + "train/total_loss": 0.5446429252624512 + }, + { + "epoch": 10.915492957746478, + "step": 3100, + "train/classification_loss": 0.17278072237968445, + "train/contrastive_loss": 1.8779497146606445, + "train/negative_loss": 1.5615594387054443, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.31639033555984497, + "train/total_loss": 0.5483706593513489 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.10711669921875, - "train/contrastive_loss": 0.6025230884552002, - "train/negative_loss": 0.6025198698043823, + "train/classification_loss": 0.303207665681839, + "train/contrastive_loss": 2.935037612915039, + "train/negative_loss": 2.9350357055664062, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 3.218658548576059e-06, - "train/total_loss": 0.22762131690979004 + "train/num_positives": 2, + "train/positive_loss": 1.7881409348774469e-06, + "train/total_loss": 0.8902151584625244 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.14392776787281036, - "train/contrastive_loss": 1.289807677268982, - "train/negative_loss": 0.9559339284896851, - "train/num_negatives": 38, + "train/classification_loss": 0.21228420734405518, + "train/contrastive_loss": 2.569387435913086, + "train/negative_loss": 1.3032070398330688, + "train/num_negatives": 40, "train/num_positives": 16, - "train/positive_loss": 0.3338737487792969, - "train/total_loss": 0.4018893241882324 + "train/positive_loss": 1.2661805152893066, + "train/total_loss": 0.7261617183685303 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.08772045373916626, - "train/contrastive_loss": 0.9549421072006226, - "train/negative_loss": 0.7380021810531616, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.21693992614746094, - "train/total_loss": 0.27870887517929077 + "train/classification_loss": 0.12310808151960373, + "train/contrastive_loss": 0.2326999306678772, + "train/negative_loss": 0.07561866194009781, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.1570812612771988, + "train/total_loss": 0.16964806616306305 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.16894616186618805, - "train/contrastive_loss": 1.448263168334961, - "train/negative_loss": 0.8016389012336731, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.6466242074966431, - "train/total_loss": 0.458598792552948 + "train/classification_loss": 0.21158453822135925, + "train/contrastive_loss": 1.064109444618225, + "train/negative_loss": 1.003908395767212, + "train/num_negatives": 40, + "train/num_positives": 8, + "train/positive_loss": 0.06020107865333557, + "train/total_loss": 0.42440640926361084 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.1489696204662323, - "train/contrastive_loss": 2.3309006690979004, - "train/negative_loss": 0.7391207218170166, - "train/num_negatives": 42, + "train/classification_loss": 0.18313325941562653, + "train/contrastive_loss": 1.17430579662323, + "train/negative_loss": 0.9207723736763, + "train/num_negatives": 38, "train/num_positives": 14, - "train/positive_loss": 1.5917800664901733, - "train/total_loss": 0.615149736404419 + "train/positive_loss": 0.25353342294692993, + "train/total_loss": 0.4179944396018982 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.16260375082492828, - "train/contrastive_loss": 0.9085520505905151, - "train/negative_loss": 0.6483113169670105, - "train/num_negatives": 50, + "train/classification_loss": 0.3142702877521515, + "train/contrastive_loss": 4.130368232727051, + "train/negative_loss": 1.5191065073013306, + "train/num_negatives": 36, "train/num_positives": 6, - "train/positive_loss": 0.260240763425827, - "train/total_loss": 0.3443141579627991 + "train/positive_loss": 2.6112618446350098, + "train/total_loss": 1.1403439044952393 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.18239237368106842, - "train/contrastive_loss": 1.765061855316162, - "train/negative_loss": 1.081243634223938, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.6838182806968689, - "train/total_loss": 0.5354047417640686 + "train/classification_loss": 0.1566716879606247, + "train/contrastive_loss": 1.673736333847046, + "train/negative_loss": 0.4677121937274933, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.206024169921875, + "train/total_loss": 0.4914189577102661 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.2420712113380432, - "train/contrastive_loss": 3.3655848503112793, - "train/negative_loss": 2.474825143814087, + "train/classification_loss": 0.12629804015159607, + "train/contrastive_loss": 0.620015025138855, + "train/negative_loss": 0.36873212456703186, "train/num_negatives": 34, "train/num_positives": 22, - "train/positive_loss": 0.8907598257064819, - "train/total_loss": 0.915188193321228 + "train/positive_loss": 0.2512829005718231, + "train/total_loss": 0.2503010630607605 + }, + { + "epoch": 10.915492957746478, + "step": 3100, + "train/classification_loss": 0.14527374505996704, + "train/contrastive_loss": 0.9354717135429382, + "train/negative_loss": 0.612289309501648, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.3231824040412903, + "train/total_loss": 0.33236807584762573 + }, + { + "epoch": 10.915492957746478, + "step": 3100, + "train/classification_loss": 0.2021377980709076, + "train/contrastive_loss": 2.8250555992126465, + "train/negative_loss": 1.6179020404815674, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.207153558731079, + "train/total_loss": 0.7671489715576172 + }, + { + "epoch": 10.915492957746478, + "step": 3100, + "train/classification_loss": 0.19269733130931854, + "train/contrastive_loss": 0.7300717830657959, + "train/negative_loss": 0.20723435282707214, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.5228374004364014, + "train/total_loss": 0.338711678981781 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.15796855092048645, - "train/contrastive_loss": 1.1215510368347168, - "train/negative_loss": 0.39289674162864685, + "train/classification_loss": 0.08335969597101212, + "train/contrastive_loss": 0.19011488556861877, + "train/negative_loss": 0.16568341851234436, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.7286542654037476, - "train/total_loss": 0.3822787404060364 + "train/num_positives": 16, + "train/positive_loss": 0.024431472644209862, + "train/total_loss": 0.12138266861438751 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.1589052528142929, - "train/contrastive_loss": 2.341857433319092, - "train/negative_loss": 1.294974684715271, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.0468827486038208, - "train/total_loss": 0.6272767186164856 + "train/classification_loss": 0.20223596692085266, + "train/contrastive_loss": 2.590609073638916, + "train/negative_loss": 1.370938777923584, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 1.2196701765060425, + "train/total_loss": 0.7203577756881714 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.26075443625450134, - "train/contrastive_loss": 3.2908811569213867, - "train/negative_loss": 1.2616039514541626, + "train/classification_loss": 0.1792982667684555, + "train/contrastive_loss": 0.8562071323394775, + "train/negative_loss": 0.8168087005615234, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 2.0292773246765137, - "train/total_loss": 0.9189306497573853 + "train/num_positives": 2, + "train/positive_loss": 0.03939841687679291, + "train/total_loss": 0.3505396842956543 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.23480775952339172, - "train/contrastive_loss": 3.614955425262451, - "train/negative_loss": 1.7329511642456055, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.8820041418075562, - "train/total_loss": 0.9577988386154175 + "train/classification_loss": 0.13246937096118927, + "train/contrastive_loss": 1.981392502784729, + "train/negative_loss": 0.9428377151489258, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.0385547876358032, + "train/total_loss": 0.5287478566169739 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.16407369077205658, - "train/contrastive_loss": 1.9473087787628174, - "train/negative_loss": 1.3644864559173584, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.5828223824501038, - "train/total_loss": 0.5535354614257812 + "train/classification_loss": 0.20984430611133575, + "train/contrastive_loss": 2.0217764377593994, + "train/negative_loss": 0.9913319945335388, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 1.0304443836212158, + "train/total_loss": 0.6141995787620544 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.2329026162624359, - "train/contrastive_loss": 4.000485420227051, - "train/negative_loss": 1.586257815361023, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 2.4142274856567383, - "train/total_loss": 1.0329997539520264 + "train/classification_loss": 0.1769595444202423, + "train/contrastive_loss": 2.7295522689819336, + "train/negative_loss": 0.8510855436325073, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 1.8784666061401367, + "train/total_loss": 0.7228699922561646 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.24381662905216217, - "train/contrastive_loss": 4.903266906738281, - "train/negative_loss": 3.4803836345672607, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.422883152961731, - "train/total_loss": 1.2244700193405151 + "train/classification_loss": 0.13547709584236145, + "train/contrastive_loss": 2.775662660598755, + "train/negative_loss": 2.7756612300872803, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 1.370908194076037e-06, + "train/total_loss": 0.6906096935272217 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.2869136929512024, - "train/contrastive_loss": 3.751512050628662, - "train/negative_loss": 1.5970779657363892, + "train/classification_loss": 0.16970960795879364, + "train/contrastive_loss": 0.7779986262321472, + "train/negative_loss": 0.5800029635429382, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 2.1544342041015625, - "train/total_loss": 1.0372161865234375 + "train/positive_loss": 0.19799566268920898, + "train/total_loss": 0.3253093361854553 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.1588798463344574, - "train/contrastive_loss": 0.720566987991333, - "train/negative_loss": 0.7059766054153442, + "train/classification_loss": 0.21894241869449615, + "train/contrastive_loss": 2.8856682777404785, + "train/negative_loss": 1.7207978963851929, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.014590372331440449, - "train/total_loss": 0.3029932379722595 + "train/num_positives": 8, + "train/positive_loss": 1.1648703813552856, + "train/total_loss": 0.7960760593414307 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.16977737843990326, - "train/contrastive_loss": 1.6370058059692383, - "train/negative_loss": 0.9607344269752502, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.6762713193893433, - "train/total_loss": 0.4971785545349121 + "train/classification_loss": 0.14858795702457428, + "train/contrastive_loss": 1.9505035877227783, + "train/negative_loss": 0.8634089827537537, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.0870946645736694, + "train/total_loss": 0.5386886596679688 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.12604369223117828, - "train/contrastive_loss": 1.5827152729034424, - "train/negative_loss": 0.5519928336143494, - "train/num_negatives": 46, + "train/classification_loss": 0.28609156608581543, + "train/contrastive_loss": 2.2845277786254883, + "train/negative_loss": 1.8844904899597168, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 1.0307223796844482, - "train/total_loss": 0.4425867795944214 + "train/positive_loss": 0.40003716945648193, + "train/total_loss": 0.7429971694946289 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.2070511281490326, - "train/contrastive_loss": 1.6299370527267456, - "train/negative_loss": 1.6299370527267456, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5330385565757751 - }, - { - "epoch": 11.787072243346007, - "eval_exact_match_accuracy": 0.31238095238095237, - "eval_hamming_loss": 0.06621848739495799, - "eval_loss": 0.5649543404579163, - "eval_macro_f1": 0.3742865936920889, - "eval_macro_precision": 0.6100450801319299, - "eval_macro_recall": 0.3057762089229254, - "eval_micro_f1": 0.5781584582441114, - "eval_micro_precision": 0.7758620689655172, - "eval_micro_recall": 0.46075085324232085, - "eval_runtime": 2.633, - "eval_samples_per_second": 199.392, - "eval_steps_per_second": 25.066, + "train/classification_loss": 0.14781293272972107, + "train/contrastive_loss": 0.9626945853233337, + "train/negative_loss": 0.8595737814903259, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 0.103120818734169, + "train/total_loss": 0.3403518497943878 + }, + { + "epoch": 10.915492957746478, + "eval_exact_match_accuracy": 0.30158730158730157, + "eval_hamming_loss": 0.06608569353667393, + "eval_loss": 0.5665774941444397, + "eval_macro_f1": 0.41538974594908723, + "eval_macro_precision": 0.6422816414068047, + "eval_macro_recall": 0.3289031447309365, + "eval_micro_f1": 0.5542337298810357, + "eval_micro_precision": 0.8065173116089613, + "eval_micro_recall": 0.42217484008528783, + "eval_runtime": 2.8429, + "eval_samples_per_second": 199.446, + "eval_steps_per_second": 24.975, "step": 3100 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.09084462374448776, - "train/contrastive_loss": 0.9179635643959045, - "train/negative_loss": 0.8824095129966736, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.03555404767394066, - "train/total_loss": 0.2744373381137848 + "train/classification_loss": 0.16276085376739502, + "train/contrastive_loss": 1.175837516784668, + "train/negative_loss": 0.42145830392837524, + "train/num_negatives": 40, + "train/num_positives": 6, + "train/positive_loss": 0.754379153251648, + "train/total_loss": 0.3979283571243286 }, { - "epoch": 11.787072243346007, + "epoch": 10.915492957746478, "step": 3100, - "train/classification_loss": 0.10937536507844925, - "train/contrastive_loss": 1.5805728435516357, - "train/negative_loss": 1.2420498132705688, + "train/classification_loss": 0.0897907018661499, + "train/contrastive_loss": 0.2587071359157562, + "train/negative_loss": 0.19876466691493988, "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.3385230600833893, - "train/total_loss": 0.4254899322986603 + "train/positive_loss": 0.059942472726106644, + "train/total_loss": 0.14153212308883667 }, { - "epoch": 11.977186311787072, - "grad_norm": 5.860901355743408, - "learning_rate": 1.9536225266362256e-05, - "loss": 0.5616, + "epoch": 11.091549295774648, + "grad_norm": 5.6430487632751465, + "learning_rate": 1.9570683579985908e-05, + "loss": 0.579, "step": 3150 }, { - "epoch": 11.977186311787072, + "epoch": 11.091549295774648, "step": 3150, - "train/classification_loss": 0.1773376762866974, - "train/contrastive_loss": 1.1457643508911133, - "train/negative_loss": 0.5096114277839661, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.636152982711792, - "train/total_loss": 0.4064905643463135 + "train/classification_loss": 0.12388253211975098, + "train/contrastive_loss": 0.2602914869785309, + "train/negative_loss": 0.25685280561447144, + "train/num_negatives": 38, + "train/num_positives": 18, + "train/positive_loss": 0.00343866809271276, + "train/total_loss": 0.17594082653522491 }, { - "epoch": 11.977186311787072, + "epoch": 11.091549295774648, "step": 3150, - "train/classification_loss": 0.17062102258205414, - "train/contrastive_loss": 1.6250792741775513, - "train/negative_loss": 0.4169893264770508, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.2080899477005005, - "train/total_loss": 0.49563688039779663 + "train/classification_loss": 0.10799126327037811, + "train/contrastive_loss": 0.43816837668418884, + "train/negative_loss": 0.20483598113059998, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.23333239555358887, + "train/total_loss": 0.1956249475479126 }, { - "epoch": 12.167300380228136, - "grad_norm": 10.641016960144043, - "learning_rate": 1.952861491628615e-05, - "loss": 0.5365, + "epoch": 11.267605633802816, + "grad_norm": 4.246716022491455, + "learning_rate": 1.9563636363636366e-05, + "loss": 0.5639, "step": 3200 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.3033762574195862, - "train/contrastive_loss": 2.032956838607788, - "train/negative_loss": 1.1869540214538574, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 0.8460027575492859, - "train/total_loss": 0.7099676132202148 + "train/classification_loss": 0.2657213509082794, + "train/contrastive_loss": 2.4152140617370605, + "train/negative_loss": 1.125178337097168, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.2900358438491821, + "train/total_loss": 0.748764157295227 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.16638611257076263, - "train/contrastive_loss": 1.9070720672607422, - "train/negative_loss": 1.2472889423370361, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.659783124923706, - "train/total_loss": 0.5478005409240723 + "train/classification_loss": 0.2557452321052551, + "train/contrastive_loss": 0.7766358256340027, + "train/negative_loss": 0.4335929751396179, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.34304285049438477, + "train/total_loss": 0.41107240319252014 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.19036902487277985, - "train/contrastive_loss": 1.069595456123352, - "train/negative_loss": 0.16125185787677765, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.9083436131477356, - "train/total_loss": 0.404288113117218 + "train/classification_loss": 0.24305664002895355, + "train/contrastive_loss": 2.6732258796691895, + "train/negative_loss": 1.402230978012085, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 1.270994782447815, + "train/total_loss": 0.7777018547058105 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.24167661368846893, - "train/contrastive_loss": 2.309422492980957, - "train/negative_loss": 1.3799318075180054, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.9294906258583069, - "train/total_loss": 0.7035611271858215 + "train/classification_loss": 0.17530137300491333, + "train/contrastive_loss": 2.785922050476074, + "train/negative_loss": 2.2605278491973877, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.5253943204879761, + "train/total_loss": 0.7324857711791992 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.10584332048892975, - "train/contrastive_loss": 1.3375616073608398, - "train/negative_loss": 0.7546820044517517, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.5828795433044434, - "train/total_loss": 0.3733556270599365 + "train/classification_loss": 0.19417934119701385, + "train/contrastive_loss": 2.4107208251953125, + "train/negative_loss": 2.1431233882904053, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.267597496509552, + "train/total_loss": 0.6763235330581665 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.17665204405784607, - "train/contrastive_loss": 1.799314022064209, - "train/negative_loss": 1.5228673219680786, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.27644675970077515, - "train/total_loss": 0.5365148782730103 + "train/classification_loss": 0.2095743864774704, + "train/contrastive_loss": 2.0488786697387695, + "train/negative_loss": 1.1765451431274414, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.8723334074020386, + "train/total_loss": 0.6193501353263855 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.21638691425323486, - "train/contrastive_loss": 2.6364150047302246, - "train/negative_loss": 1.5924241542816162, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 1.0439907312393188, - "train/total_loss": 0.7436699271202087 + "train/classification_loss": 0.1819399893283844, + "train/contrastive_loss": 1.5255699157714844, + "train/negative_loss": 0.6970598697662354, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.8285099864006042, + "train/total_loss": 0.4870539903640747 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.17018739879131317, - "train/contrastive_loss": 2.2428979873657227, - "train/negative_loss": 1.962437391281128, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.2804606854915619, - "train/total_loss": 0.6187670230865479 + "train/classification_loss": 0.18864093720912933, + "train/contrastive_loss": 1.0019463300704956, + "train/negative_loss": 1.0014688968658447, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 0.00047742793685756624, + "train/total_loss": 0.38903021812438965 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.1404886245727539, - "train/contrastive_loss": 1.4072303771972656, - "train/negative_loss": 1.3032842874526978, + "train/classification_loss": 0.10362506657838821, + "train/contrastive_loss": 0.5058585405349731, + "train/negative_loss": 0.28313660621643066, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.10394608229398727, - "train/total_loss": 0.42193469405174255 + "train/positive_loss": 0.22272193431854248, + "train/total_loss": 0.20479677617549896 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.3515789806842804, - "train/contrastive_loss": 2.9253363609313965, - "train/negative_loss": 1.1635918617248535, + "train/classification_loss": 0.1796669065952301, + "train/contrastive_loss": 2.56162428855896, + "train/negative_loss": 1.7271939516067505, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.761744499206543, - "train/total_loss": 0.9366462230682373 + "train/num_positives": 14, + "train/positive_loss": 0.8344303369522095, + "train/total_loss": 0.6919918060302734 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.19104784727096558, - "train/contrastive_loss": 2.4911301136016846, - "train/negative_loss": 1.6188042163848877, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.8723259568214417, - "train/total_loss": 0.6892738342285156 + "train/classification_loss": 0.14753808081150055, + "train/contrastive_loss": 1.4757665395736694, + "train/negative_loss": 0.9883856773376465, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.48738083243370056, + "train/total_loss": 0.4426913857460022 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.1205240860581398, - "train/contrastive_loss": 1.825246810913086, - "train/negative_loss": 0.6261725425720215, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 1.1990742683410645, - "train/total_loss": 0.4855734407901764 + "train/classification_loss": 0.16208414733409882, + "train/contrastive_loss": 1.2481707334518433, + "train/negative_loss": 1.0363537073135376, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.21181702613830566, + "train/total_loss": 0.41171830892562866 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.17279472947120667, - "train/contrastive_loss": 2.9953222274780273, - "train/negative_loss": 1.5381007194519043, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.4572213888168335, - "train/total_loss": 0.7718591690063477 + "train/classification_loss": 0.19019164144992828, + "train/contrastive_loss": 3.2874152660369873, + "train/negative_loss": 1.6921882629394531, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.5952270030975342, + "train/total_loss": 0.8476746678352356 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.09712737053632736, - "train/contrastive_loss": 0.608148992061615, - "train/negative_loss": 0.6081073880195618, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 4.1615116060711443e-05, - "train/total_loss": 0.21875716745853424 + "train/classification_loss": 0.15533556044101715, + "train/contrastive_loss": 1.011749505996704, + "train/negative_loss": 0.698829174041748, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.3129202723503113, + "train/total_loss": 0.3576854467391968 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.1067199632525444, - "train/contrastive_loss": 1.1914440393447876, - "train/negative_loss": 1.1772253513336182, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.014218712225556374, - "train/total_loss": 0.3450087606906891 + "train/classification_loss": 0.14520874619483948, + "train/contrastive_loss": 2.6112098693847656, + "train/negative_loss": 0.7664363980293274, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.844773530960083, + "train/total_loss": 0.6674507856369019 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.1366107314825058, - "train/contrastive_loss": 1.2487602233886719, - "train/negative_loss": 0.5439838171005249, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.704776406288147, - "train/total_loss": 0.38636279106140137 + "train/classification_loss": 0.14024148881435394, + "train/contrastive_loss": 0.7283188104629517, + "train/negative_loss": 0.2680666446685791, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.46025216579437256, + "train/total_loss": 0.28590524196624756 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.2283368557691574, - "train/contrastive_loss": 2.487314224243164, - "train/negative_loss": 1.3222020864486694, - "train/num_negatives": 40, + "train/classification_loss": 0.11755108833312988, + "train/contrastive_loss": 1.118392825126648, + "train/negative_loss": 0.544413149356842, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 1.1651121377944946, - "train/total_loss": 0.7257996797561646 + "train/positive_loss": 0.5739796757698059, + "train/total_loss": 0.3412296772003174 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.19261862337589264, - "train/contrastive_loss": 1.7370685338974, - "train/negative_loss": 0.3487166166305542, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 1.3883519172668457, - "train/total_loss": 0.5400323271751404 + "train/classification_loss": 0.17467555403709412, + "train/contrastive_loss": 1.3797621726989746, + "train/negative_loss": 0.34697166085243225, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 1.0327905416488647, + "train/total_loss": 0.45062798261642456 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.17281222343444824, - "train/contrastive_loss": 0.623302698135376, - "train/negative_loss": 0.6063300967216492, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.01697259210050106, - "train/total_loss": 0.2974727749824524 + "train/classification_loss": 0.15240579843521118, + "train/contrastive_loss": 2.2916314601898193, + "train/negative_loss": 1.2864196300506592, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 1.0052118301391602, + "train/total_loss": 0.6107320785522461 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.13490571081638336, - "train/contrastive_loss": 1.0188074111938477, - "train/negative_loss": 0.5202519297599792, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.4985555410385132, - "train/total_loss": 0.33866721391677856 + "train/classification_loss": 0.22683919966220856, + "train/contrastive_loss": 3.8062803745269775, + "train/negative_loss": 1.1943809986114502, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 2.6118993759155273, + "train/total_loss": 0.9880952835083008 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.19602683186531067, - "train/contrastive_loss": 1.7045906782150269, - "train/negative_loss": 0.33503493666648865, - "train/num_negatives": 44, + "train/classification_loss": 0.1141100600361824, + "train/contrastive_loss": 1.0588958263397217, + "train/negative_loss": 1.0526171922683716, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.3695557117462158, - "train/total_loss": 0.5369449853897095 + "train/positive_loss": 0.006278581917285919, + "train/total_loss": 0.3258892297744751 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.24770492315292358, - "train/contrastive_loss": 1.958275318145752, - "train/negative_loss": 1.5418590307235718, - "train/num_negatives": 44, + "train/classification_loss": 0.1382991522550583, + "train/contrastive_loss": 2.9155030250549316, + "train/negative_loss": 2.0782766342163086, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.4164162576198578, - "train/total_loss": 0.6393599510192871 + "train/positive_loss": 0.8372265100479126, + "train/total_loss": 0.7213997840881348 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.15128859877586365, - "train/contrastive_loss": 1.7519009113311768, - "train/negative_loss": 0.708453357219696, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 1.043447494506836, - "train/total_loss": 0.5016688108444214 + "train/classification_loss": 0.13700391352176666, + "train/contrastive_loss": 1.6794188022613525, + "train/negative_loss": 1.38852858543396, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.2908901572227478, + "train/total_loss": 0.47288769483566284 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.15752431750297546, - "train/contrastive_loss": 1.3301414251327515, - "train/negative_loss": 0.29534101486206055, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 1.034800410270691, - "train/total_loss": 0.42355260252952576 + "train/classification_loss": 0.22930797934532166, + "train/contrastive_loss": 1.8620128631591797, + "train/negative_loss": 1.4810782670974731, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.38093459606170654, + "train/total_loss": 0.6017105579376221 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.1069546565413475, - "train/contrastive_loss": 1.303917646408081, - "train/negative_loss": 0.3673633337020874, + "train/classification_loss": 0.16875040531158447, + "train/contrastive_loss": 2.291365146636963, + "train/negative_loss": 1.2841113805770874, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.9365543723106384, - "train/total_loss": 0.36773818731307983 + "train/num_positives": 10, + "train/positive_loss": 1.007253646850586, + "train/total_loss": 0.627023458480835 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.27935081720352173, - "train/contrastive_loss": 2.094120740890503, - "train/negative_loss": 0.4884014427661896, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.6057193279266357, - "train/total_loss": 0.6981749534606934 + "train/classification_loss": 0.22738637030124664, + "train/contrastive_loss": 3.314983606338501, + "train/negative_loss": 2.4215595722198486, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.8934239745140076, + "train/total_loss": 0.8903830647468567 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.2696740925312042, - "train/contrastive_loss": 3.470874309539795, - "train/negative_loss": 1.6296273469924927, + "train/classification_loss": 0.18316414952278137, + "train/contrastive_loss": 1.8833078145980835, + "train/negative_loss": 1.883018136024475, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.8412468433380127, - "train/total_loss": 0.9638489484786987 + "train/num_positives": 4, + "train/positive_loss": 0.00028972988366149366, + "train/total_loss": 0.5598257184028625 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.16703344881534576, - "train/contrastive_loss": 3.0512685775756836, - "train/negative_loss": 2.211282730102539, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.8399858474731445, - "train/total_loss": 0.7772871851921082 + "train/classification_loss": 0.17130056023597717, + "train/contrastive_loss": 0.2737555503845215, + "train/negative_loss": 0.23766019940376282, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.03609533980488777, + "train/total_loss": 0.2260516732931137 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.20218901336193085, - "train/contrastive_loss": 0.9792959690093994, - "train/negative_loss": 0.7226622700691223, - "train/num_negatives": 40, + "train/classification_loss": 0.2610934376716614, + "train/contrastive_loss": 2.8144679069519043, + "train/negative_loss": 1.6672781705856323, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.2566337287425995, - "train/total_loss": 0.3980482220649719 - }, - { - "epoch": 12.167300380228136, - "step": 3200, - "train/classification_loss": 0.23004037141799927, - "train/contrastive_loss": 0.9204249382019043, - "train/negative_loss": 0.6168329119682312, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.3035920560359955, - "train/total_loss": 0.41412538290023804 - }, - { - "epoch": 12.167300380228136, - "step": 3200, - "train/classification_loss": 0.1120409369468689, - "train/contrastive_loss": 1.1696833372116089, - "train/negative_loss": 0.32636550068855286, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.8433178663253784, - "train/total_loss": 0.3459776043891907 + "train/positive_loss": 1.147189736366272, + "train/total_loss": 0.8239870071411133 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.22430598735809326, - "train/contrastive_loss": 2.4750232696533203, - "train/negative_loss": 0.9886041283607483, + "train/classification_loss": 0.18560656905174255, + "train/contrastive_loss": 0.6844651103019714, + "train/negative_loss": 0.6806688904762268, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.4864192008972168, - "train/total_loss": 0.7193106412887573 + "train/num_positives": 10, + "train/positive_loss": 0.003796215867623687, + "train/total_loss": 0.3224995732307434 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.26892510056495667, - "train/contrastive_loss": 1.1921851634979248, - "train/negative_loss": 1.1921066045761108, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 7.856200681999326e-05, - "train/total_loss": 0.5073621273040771 + "train/classification_loss": 0.17031270265579224, + "train/contrastive_loss": 1.5365175008773804, + "train/negative_loss": 1.4684834480285645, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.0680341050028801, + "train/total_loss": 0.47761622071266174 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.16998811066150665, - "train/contrastive_loss": 0.931289792060852, - "train/negative_loss": 0.8713828921318054, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.05990688130259514, - "train/total_loss": 0.35624605417251587 + "train/classification_loss": 0.15797072649002075, + "train/contrastive_loss": 2.588449478149414, + "train/negative_loss": 2.09267258644104, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.4957770109176636, + "train/total_loss": 0.6756606101989746 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.20049183070659637, - "train/contrastive_loss": 2.745680093765259, - "train/negative_loss": 2.44014835357666, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.3055317997932434, - "train/total_loss": 0.7496278882026672 + "train/classification_loss": 0.1835637092590332, + "train/contrastive_loss": 1.3325707912445068, + "train/negative_loss": 0.6118554472923279, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.7207152843475342, + "train/total_loss": 0.4500778615474701 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.16538883745670319, - "train/contrastive_loss": 3.0061659812927246, - "train/negative_loss": 1.208335280418396, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.7978308200836182, - "train/total_loss": 0.766622006893158 + "train/classification_loss": 0.23642148077487946, + "train/contrastive_loss": 2.7995941638946533, + "train/negative_loss": 1.9201481342315674, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.8794460296630859, + "train/total_loss": 0.79634028673172 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.14624306559562683, - "train/contrastive_loss": 1.8024122714996338, - "train/negative_loss": 1.106402039527893, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.6960102319717407, - "train/total_loss": 0.506725549697876 + "train/classification_loss": 0.23108001053333282, + "train/contrastive_loss": 1.940598726272583, + "train/negative_loss": 1.0866413116455078, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.8539574146270752, + "train/total_loss": 0.6191997528076172 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.14847755432128906, - "train/contrastive_loss": 0.8771008253097534, - "train/negative_loss": 0.8754758834838867, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.001624950091354549, - "train/total_loss": 0.32389771938323975 + "train/classification_loss": 0.15691709518432617, + "train/contrastive_loss": 2.119863748550415, + "train/negative_loss": 2.119856357574463, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 7.459197604475776e-06, + "train/total_loss": 0.5808898210525513 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.19007787108421326, - "train/contrastive_loss": 1.489441990852356, - "train/negative_loss": 1.4064072370529175, + "train/classification_loss": 0.19563058018684387, + "train/contrastive_loss": 2.2068891525268555, + "train/negative_loss": 0.7632665634155273, "train/num_negatives": 46, "train/num_positives": 8, - "train/positive_loss": 0.08303475379943848, - "train/total_loss": 0.48796626925468445 + "train/positive_loss": 1.4436225891113281, + "train/total_loss": 0.6370084285736084 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.16741175949573517, - "train/contrastive_loss": 2.34466552734375, - "train/negative_loss": 2.3379292488098145, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.006736206356436014, - "train/total_loss": 0.636344850063324 + "train/classification_loss": 0.23053982853889465, + "train/contrastive_loss": 2.235748529434204, + "train/negative_loss": 1.96981680393219, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.2659316658973694, + "train/total_loss": 0.6776895523071289 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.1563311517238617, - "train/contrastive_loss": 0.7958816885948181, - "train/negative_loss": 0.7319616675376892, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.0639200359582901, - "train/total_loss": 0.3155074715614319 + "train/classification_loss": 0.2153698056936264, + "train/contrastive_loss": 0.7962314486503601, + "train/negative_loss": 0.3385002911090851, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.457731157541275, + "train/total_loss": 0.3746160864830017 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.18411007523536682, - "train/contrastive_loss": 3.288682460784912, - "train/negative_loss": 2.4887263774871826, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.7999560832977295, - "train/total_loss": 0.8418465852737427 + "train/classification_loss": 0.2736409604549408, + "train/contrastive_loss": 4.180439472198486, + "train/negative_loss": 1.5394563674926758, + "train/num_negatives": 42, + "train/num_positives": 8, + "train/positive_loss": 2.6409831047058105, + "train/total_loss": 1.1097288131713867 + }, + { + "epoch": 11.267605633802816, + "step": 3200, + "train/classification_loss": 0.1687142699956894, + "train/contrastive_loss": 1.5914890766143799, + "train/negative_loss": 1.19833505153656, + "train/num_negatives": 46, + "train/num_positives": 10, + "train/positive_loss": 0.3931540548801422, + "train/total_loss": 0.4870120882987976 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.20760221779346466, - "train/contrastive_loss": 0.7590461373329163, - "train/negative_loss": 0.3164156675338745, + "train/classification_loss": 0.18804609775543213, + "train/contrastive_loss": 2.65848708152771, + "train/negative_loss": 1.5354578495025635, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.44263046979904175, - "train/total_loss": 0.35941144824028015 + "train/num_positives": 14, + "train/positive_loss": 1.1230292320251465, + "train/total_loss": 0.719743549823761 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.14207352697849274, - "train/contrastive_loss": 2.183028221130371, - "train/negative_loss": 1.5825159549713135, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.6005121469497681, - "train/total_loss": 0.5786792039871216 + "train/classification_loss": 0.15927208960056305, + "train/contrastive_loss": 0.6541785001754761, + "train/negative_loss": 0.6539868712425232, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 0.0001916557375807315, + "train/total_loss": 0.290107786655426 + }, + { + "epoch": 11.267605633802816, + "step": 3200, + "train/classification_loss": 0.24697287380695343, + "train/contrastive_loss": 0.8290350437164307, + "train/negative_loss": 0.7988327145576477, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.03020232729613781, + "train/total_loss": 0.41277986764907837 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.1540694385766983, - "train/contrastive_loss": 1.5937228202819824, - "train/negative_loss": 0.9881273508071899, + "train/classification_loss": 0.15328232944011688, + "train/contrastive_loss": 0.5345073342323303, + "train/negative_loss": 0.525547444820404, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.6055954694747925, - "train/total_loss": 0.47281402349472046 + "train/num_positives": 12, + "train/positive_loss": 0.008959909901022911, + "train/total_loss": 0.26018381118774414 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.2790834903717041, - "train/contrastive_loss": 1.5263618230819702, - "train/negative_loss": 1.1600666046142578, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.3662952184677124, - "train/total_loss": 0.5843558311462402 + "train/classification_loss": 0.35116690397262573, + "train/contrastive_loss": 2.0803022384643555, + "train/negative_loss": 0.9331258535385132, + "train/num_negatives": 30, + "train/num_positives": 18, + "train/positive_loss": 1.1471765041351318, + "train/total_loss": 0.7672273516654968 + }, + { + "epoch": 11.267605633802816, + "step": 3200, + "train/classification_loss": 0.1320287138223648, + "train/contrastive_loss": 2.4381017684936523, + "train/negative_loss": 0.8239127397537231, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.6141890287399292, + "train/total_loss": 0.6196490526199341 + }, + { + "epoch": 11.267605633802816, + "step": 3200, + "train/classification_loss": 0.19773712754249573, + "train/contrastive_loss": 3.7626452445983887, + "train/negative_loss": 3.1881208419799805, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.5745243430137634, + "train/total_loss": 0.9502662420272827 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.11503975093364716, - "train/contrastive_loss": 0.7865913510322571, - "train/negative_loss": 0.785078227519989, + "train/classification_loss": 0.28499636054039, + "train/contrastive_loss": 2.309828042984009, + "train/negative_loss": 2.309826612472534, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.0015131181571632624, - "train/total_loss": 0.2723580300807953 + "train/num_positives": 2, + "train/positive_loss": 1.3113030945532955e-06, + "train/total_loss": 0.7469619512557983 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.1274508833885193, - "train/contrastive_loss": 1.3444256782531738, - "train/negative_loss": 0.3971507251262665, - "train/num_negatives": 38, + "train/classification_loss": 0.196963831782341, + "train/contrastive_loss": 3.1224212646484375, + "train/negative_loss": 1.2401056289672852, + "train/num_negatives": 40, "train/num_positives": 16, - "train/positive_loss": 0.9472749829292297, - "train/total_loss": 0.39633601903915405 + "train/positive_loss": 1.8823156356811523, + "train/total_loss": 0.8214480876922607 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.08278388530015945, - "train/contrastive_loss": 0.5228685140609741, - "train/negative_loss": 0.510187566280365, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.012680970132350922, - "train/total_loss": 0.1873575896024704 + "train/classification_loss": 0.11312103271484375, + "train/contrastive_loss": 0.1012469157576561, + "train/negative_loss": 0.08254464715719223, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.018702266737818718, + "train/total_loss": 0.13337041437625885 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.1775798797607422, - "train/contrastive_loss": 1.0535132884979248, - "train/negative_loss": 0.19155652821063995, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.8619567155838013, - "train/total_loss": 0.38828253746032715 + "train/classification_loss": 0.19312772154808044, + "train/contrastive_loss": 0.7449637651443481, + "train/negative_loss": 0.6785001158714294, + "train/num_negatives": 40, + "train/num_positives": 8, + "train/positive_loss": 0.06646361947059631, + "train/total_loss": 0.3421204686164856 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.15417589247226715, - "train/contrastive_loss": 2.052126407623291, - "train/negative_loss": 0.6602099537849426, - "train/num_negatives": 42, + "train/classification_loss": 0.1988956779241562, + "train/contrastive_loss": 1.525086760520935, + "train/negative_loss": 1.246677041053772, + "train/num_negatives": 38, "train/num_positives": 14, - "train/positive_loss": 1.3919165134429932, - "train/total_loss": 0.5646011829376221 + "train/positive_loss": 0.2784097194671631, + "train/total_loss": 0.5039130449295044 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.15233255922794342, - "train/contrastive_loss": 0.36858218908309937, - "train/negative_loss": 0.3653091490268707, - "train/num_negatives": 50, + "train/classification_loss": 0.27779915928840637, + "train/contrastive_loss": 2.391793966293335, + "train/negative_loss": 0.9761002659797668, + "train/num_negatives": 36, "train/num_positives": 6, - "train/positive_loss": 0.0032730349339544773, - "train/total_loss": 0.22604900598526 + "train/positive_loss": 1.4156936407089233, + "train/total_loss": 0.7561579942703247 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.2255382388830185, - "train/contrastive_loss": 3.477546215057373, - "train/negative_loss": 1.4942020177841187, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.9833440780639648, - "train/total_loss": 0.9210475087165833 + "train/classification_loss": 0.1357644945383072, + "train/contrastive_loss": 0.4140526056289673, + "train/negative_loss": 0.22338993847370148, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.19066265225410461, + "train/total_loss": 0.21857501566410065 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.2347419559955597, - "train/contrastive_loss": 2.4350502490997314, - "train/negative_loss": 1.3265058994293213, + "train/classification_loss": 0.12739631533622742, + "train/contrastive_loss": 0.8716710805892944, + "train/negative_loss": 0.6946232914924622, "train/num_negatives": 34, "train/num_positives": 22, - "train/positive_loss": 1.1085443496704102, - "train/total_loss": 0.7217520475387573 + "train/positive_loss": 0.17704780399799347, + "train/total_loss": 0.30173051357269287 + }, + { + "epoch": 11.267605633802816, + "step": 3200, + "train/classification_loss": 0.15808850526809692, + "train/contrastive_loss": 2.0376715660095215, + "train/negative_loss": 0.7465929388999939, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.2910786867141724, + "train/total_loss": 0.5656228065490723 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.19309452176094055, - "train/contrastive_loss": 1.8463294506072998, - "train/negative_loss": 0.5466159582138062, + "train/classification_loss": 0.1801939159631729, + "train/contrastive_loss": 2.3404970169067383, + "train/negative_loss": 0.9966110587120056, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.343885898590088, + "train/total_loss": 0.6482933163642883 + }, + { + "epoch": 11.267605633802816, + "step": 3200, + "train/classification_loss": 0.19381454586982727, + "train/contrastive_loss": 1.2143474817276, + "train/negative_loss": 0.7627474665641785, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.45160001516342163, + "train/total_loss": 0.4366840422153473 + }, + { + "epoch": 11.267605633802816, + "step": 3200, + "train/classification_loss": 0.09656321257352829, + "train/contrastive_loss": 0.42125219106674194, + "train/negative_loss": 0.4189333915710449, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 1.2997134923934937, - "train/total_loss": 0.562360405921936 + "train/num_positives": 16, + "train/positive_loss": 0.0023188029881566763, + "train/total_loss": 0.18081365525722504 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.16538842022418976, - "train/contrastive_loss": 3.255952835083008, - "train/negative_loss": 1.673946499824524, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.5820064544677734, - "train/total_loss": 0.8165789842605591 + "train/classification_loss": 0.19637297093868256, + "train/contrastive_loss": 2.6825804710388184, + "train/negative_loss": 1.944100260734558, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 0.738480269908905, + "train/total_loss": 0.7328891158103943 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.267682284116745, - "train/contrastive_loss": 3.6064724922180176, - "train/negative_loss": 1.5830355882644653, + "train/classification_loss": 0.22072051465511322, + "train/contrastive_loss": 1.3003768920898438, + "train/negative_loss": 1.2969356775283813, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 2.023437023162842, - "train/total_loss": 0.9889768362045288 + "train/num_positives": 2, + "train/positive_loss": 0.0034412278328090906, + "train/total_loss": 0.4807959198951721 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.24742025136947632, - "train/contrastive_loss": 3.805393695831299, - "train/negative_loss": 1.9693572521209717, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.8360363245010376, - "train/total_loss": 1.008499026298523 + "train/classification_loss": 0.15202614665031433, + "train/contrastive_loss": 2.108879327774048, + "train/negative_loss": 0.9631352424621582, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.1457440853118896, + "train/total_loss": 0.5738019943237305 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.18610572814941406, - "train/contrastive_loss": 2.3434958457946777, - "train/negative_loss": 1.1567860841751099, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.1867096424102783, - "train/total_loss": 0.6548049449920654 + "train/classification_loss": 0.18210817873477936, + "train/contrastive_loss": 1.1530498266220093, + "train/negative_loss": 0.9356790781021118, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.21737070381641388, + "train/total_loss": 0.41271814703941345 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.21046297252178192, - "train/contrastive_loss": 4.43275260925293, - "train/negative_loss": 1.8159997463226318, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 2.616753101348877, - "train/total_loss": 1.0970134735107422 + "train/classification_loss": 0.17568279802799225, + "train/contrastive_loss": 2.3337693214416504, + "train/negative_loss": 0.6237368583679199, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 1.71003258228302, + "train/total_loss": 0.642436683177948 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.24071921408176422, - "train/contrastive_loss": 2.161190986633301, - "train/negative_loss": 1.0341713428497314, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.1270196437835693, - "train/total_loss": 0.6729574203491211 + "train/classification_loss": 0.15240773558616638, + "train/contrastive_loss": 2.2747690677642822, + "train/negative_loss": 2.2747669219970703, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 2.0265620150894392e-06, + "train/total_loss": 0.6073615550994873 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.2693048417568207, - "train/contrastive_loss": 3.193943500518799, - "train/negative_loss": 1.0889304876327515, + "train/classification_loss": 0.15467776358127594, + "train/contrastive_loss": 0.8875606060028076, + "train/negative_loss": 0.38291463255882263, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 2.105012893676758, - "train/total_loss": 0.9080935716629028 + "train/positive_loss": 0.5046459436416626, + "train/total_loss": 0.3321898877620697 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.14936432242393494, - "train/contrastive_loss": 0.45334184169769287, - "train/negative_loss": 0.45321619510650635, + "train/classification_loss": 0.2030763179063797, + "train/contrastive_loss": 2.305759906768799, + "train/negative_loss": 1.2035760879516602, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.00012563244672492146, - "train/total_loss": 0.24003270268440247 + "train/num_positives": 8, + "train/positive_loss": 1.1021839380264282, + "train/total_loss": 0.6642283201217651 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.16658197343349457, - "train/contrastive_loss": 1.590714931488037, - "train/negative_loss": 1.0675523281097412, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.5231626033782959, - "train/total_loss": 0.4847249388694763 + "train/classification_loss": 0.15912555158138275, + "train/contrastive_loss": 1.9390206336975098, + "train/negative_loss": 0.7214970588684082, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.2175235748291016, + "train/total_loss": 0.546929657459259 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.1354908049106598, - "train/contrastive_loss": 1.8387157917022705, - "train/negative_loss": 0.6697853207588196, - "train/num_negatives": 46, + "train/classification_loss": 0.26647865772247314, + "train/contrastive_loss": 1.6334317922592163, + "train/negative_loss": 1.2446074485778809, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 1.1689305305480957, - "train/total_loss": 0.5032339692115784 + "train/positive_loss": 0.38882434368133545, + "train/total_loss": 0.5931650400161743 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.18398000299930573, - "train/contrastive_loss": 1.5330724716186523, - "train/negative_loss": 1.5330724716186523, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.4905945062637329 - }, - { - "epoch": 12.167300380228136, - "eval_exact_match_accuracy": 0.30666666666666664, - "eval_hamming_loss": 0.06554621848739496, - "eval_loss": 0.5636638402938843, - "eval_macro_f1": 0.3811535693291102, - "eval_macro_precision": 0.6418427349749282, - "eval_macro_recall": 0.29213060309280214, - "eval_micro_f1": 0.5695364238410596, - "eval_micro_precision": 0.80625, - "eval_micro_recall": 0.4402730375426621, - "eval_runtime": 2.6242, - "eval_samples_per_second": 200.057, - "eval_steps_per_second": 25.15, + "train/classification_loss": 0.17929764091968536, + "train/contrastive_loss": 0.8770337700843811, + "train/negative_loss": 0.8769389986991882, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 9.478629363002256e-05, + "train/total_loss": 0.3547043800354004 + }, + { + "epoch": 11.267605633802816, + "eval_exact_match_accuracy": 0.30864197530864196, + "eval_hamming_loss": 0.06753812636165578, + "eval_loss": 0.5526972413063049, + "eval_macro_f1": 0.41685994852399694, + "eval_macro_precision": 0.5955618442810778, + "eval_macro_recall": 0.3481723928585303, + "eval_micro_f1": 0.5680159256801592, + "eval_micro_precision": 0.7521968365553603, + "eval_micro_recall": 0.4562899786780384, + "eval_runtime": 2.8463, + "eval_samples_per_second": 199.209, + "eval_steps_per_second": 24.945, "step": 3200 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.13711850345134735, - "train/contrastive_loss": 2.8926241397857666, - "train/negative_loss": 0.7703518271446228, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 2.122272253036499, - "train/total_loss": 0.7156433463096619 + "train/classification_loss": 0.20883125066757202, + "train/contrastive_loss": 0.7995290756225586, + "train/negative_loss": 0.5994036793708801, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.20012541115283966, + "train/total_loss": 0.3687370717525482 }, { - "epoch": 12.167300380228136, + "epoch": 11.267605633802816, "step": 3200, - "train/classification_loss": 0.10086507350206375, - "train/contrastive_loss": 0.30810239911079407, - "train/negative_loss": 0.3079071044921875, - "train/num_negatives": 22, - "train/num_positives": 16, - "train/positive_loss": 0.0001952886814251542, - "train/total_loss": 0.16248555481433868 + "train/classification_loss": 0.08999417722225189, + "train/contrastive_loss": 0.4491097927093506, + "train/negative_loss": 0.44908660650253296, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 2.318649785593152e-05, + "train/total_loss": 0.1798161268234253 }, { - "epoch": 12.357414448669202, - "grad_norm": 14.26032543182373, - "learning_rate": 1.9521004566210045e-05, - "loss": 0.5355, + "epoch": 11.443661971830986, + "grad_norm": 11.294279098510742, + "learning_rate": 1.9556589147286824e-05, + "loss": 0.564, "step": 3250 }, { - "epoch": 12.357414448669202, + "epoch": 11.443661971830986, "step": 3250, - "train/classification_loss": 0.12856727838516235, - "train/contrastive_loss": 0.6080208420753479, - "train/negative_loss": 0.6059679985046387, - "train/num_negatives": 48, + "train/classification_loss": 0.10319013148546219, + "train/contrastive_loss": 0.5846144556999207, + "train/negative_loss": 0.5358230471611023, + "train/num_negatives": 52, "train/num_positives": 4, - "train/positive_loss": 0.0020528684835880995, - "train/total_loss": 0.2501714527606964 + "train/positive_loss": 0.04879140853881836, + "train/total_loss": 0.22011302411556244 }, { - "epoch": 12.357414448669202, + "epoch": 11.443661971830986, "step": 3250, - "train/classification_loss": 0.061175744980573654, - "train/contrastive_loss": 0.6554795503616333, - "train/negative_loss": 0.655462920665741, - "train/num_negatives": 36, - "train/num_positives": 20, - "train/positive_loss": 1.6641793990856968e-05, - "train/total_loss": 0.1922716647386551 + "train/classification_loss": 0.109939806163311, + "train/contrastive_loss": 1.1497458219528198, + "train/negative_loss": 1.0219770669937134, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.12776875495910645, + "train/total_loss": 0.33988896012306213 }, { - "epoch": 12.547528517110266, - "grad_norm": 8.37732219696045, - "learning_rate": 1.9513394216133943e-05, - "loss": 0.5288, + "epoch": 11.619718309859154, + "grad_norm": 6.208378791809082, + "learning_rate": 1.9549541930937282e-05, + "loss": 0.5965, "step": 3300 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.34707939624786377, - "train/contrastive_loss": 2.2800052165985107, - "train/negative_loss": 0.8693315386772156, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.4106736183166504, - "train/total_loss": 0.8030804395675659 + "train/classification_loss": 0.271824449300766, + "train/contrastive_loss": 2.7425999641418457, + "train/negative_loss": 1.4797563552856445, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.2628434896469116, + "train/total_loss": 0.8203444480895996 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.15195316076278687, - "train/contrastive_loss": 1.1858899593353271, - "train/negative_loss": 0.8546020984649658, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.33128783106803894, - "train/total_loss": 0.3891311585903168 + "train/classification_loss": 0.2308635115623474, + "train/contrastive_loss": 0.5782185792922974, + "train/negative_loss": 0.40379682183265686, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.1744217574596405, + "train/total_loss": 0.3465072214603424 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.17095470428466797, - "train/contrastive_loss": 1.1405926942825317, - "train/negative_loss": 0.23351936042308807, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.9070733785629272, - "train/total_loss": 0.3990732431411743 + "train/classification_loss": 0.2390766143798828, + "train/contrastive_loss": 2.477250099182129, + "train/negative_loss": 1.5003087520599365, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.9769412875175476, + "train/total_loss": 0.7345266342163086 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.22500792145729065, - "train/contrastive_loss": 3.5760860443115234, - "train/negative_loss": 2.1551015377044678, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.4209843873977661, - "train/total_loss": 0.9402251243591309 + "train/classification_loss": 0.1614062339067459, + "train/contrastive_loss": 2.4115052223205566, + "train/negative_loss": 1.9254984855651855, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.48600685596466064, + "train/total_loss": 0.643707275390625 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.10647831857204437, - "train/contrastive_loss": 1.5577906370162964, - "train/negative_loss": 1.1333181858062744, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.42447248101234436, - "train/total_loss": 0.41803646087646484 + "train/classification_loss": 0.2126631736755371, + "train/contrastive_loss": 2.995148181915283, + "train/negative_loss": 2.3923137187957764, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.6028344631195068, + "train/total_loss": 0.8116928339004517 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.17271435260772705, - "train/contrastive_loss": 1.7051204442977905, - "train/negative_loss": 1.270073652267456, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.4350467622280121, - "train/total_loss": 0.5137384533882141 + "train/classification_loss": 0.2108817845582962, + "train/contrastive_loss": 2.171492099761963, + "train/negative_loss": 1.3912353515625, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.7802567481994629, + "train/total_loss": 0.6451802253723145 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.2132800668478012, - "train/contrastive_loss": 2.241168975830078, - "train/negative_loss": 1.0480597019195557, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 1.193109154701233, - "train/total_loss": 0.6615138649940491 + "train/classification_loss": 0.17042870819568634, + "train/contrastive_loss": 1.3452556133270264, + "train/negative_loss": 0.9358770847320557, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.4093785583972931, + "train/total_loss": 0.4394798278808594 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.14746928215026855, - "train/contrastive_loss": 1.566650152206421, - "train/negative_loss": 0.9876781105995178, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.5789721012115479, - "train/total_loss": 0.46079930663108826 + "train/classification_loss": 0.17551346123218536, + "train/contrastive_loss": 1.0474576950073242, + "train/negative_loss": 1.0466018915176392, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 0.000855811988003552, + "train/total_loss": 0.38500499725341797 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.12846985459327698, - "train/contrastive_loss": 0.9369268417358398, - "train/negative_loss": 0.9175481200218201, + "train/classification_loss": 0.10680711269378662, + "train/contrastive_loss": 0.8097406625747681, + "train/negative_loss": 0.6321636438369751, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.019378717988729477, - "train/total_loss": 0.3158552050590515 + "train/positive_loss": 0.17757698893547058, + "train/total_loss": 0.2687552571296692 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.3209705352783203, - "train/contrastive_loss": 2.314624309539795, - "train/negative_loss": 1.0588639974594116, + "train/classification_loss": 0.17906393110752106, + "train/contrastive_loss": 3.3575968742370605, + "train/negative_loss": 2.1975290775299072, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.2557601928710938, - "train/total_loss": 0.7838953733444214 + "train/num_positives": 14, + "train/positive_loss": 1.1600677967071533, + "train/total_loss": 0.8505833148956299 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.1761116087436676, - "train/contrastive_loss": 2.5818777084350586, - "train/negative_loss": 1.6032609939575195, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.9786167144775391, - "train/total_loss": 0.6924871206283569 + "train/classification_loss": 0.13731499016284943, + "train/contrastive_loss": 1.4563870429992676, + "train/negative_loss": 0.9088473916053772, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.5475396513938904, + "train/total_loss": 0.42859238386154175 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.11202000826597214, - "train/contrastive_loss": 1.2945212125778198, - "train/negative_loss": 0.3875604569911957, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.9069607257843018, - "train/total_loss": 0.3709242641925812 + "train/classification_loss": 0.1645163595676422, + "train/contrastive_loss": 1.7096819877624512, + "train/negative_loss": 1.533729076385498, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.1759529560804367, + "train/total_loss": 0.5064527988433838 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.14182084798812866, - "train/contrastive_loss": 2.196415901184082, - "train/negative_loss": 1.8250938653945923, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.37132203578948975, - "train/total_loss": 0.581104040145874 + "train/classification_loss": 0.20296643674373627, + "train/contrastive_loss": 3.4124557971954346, + "train/negative_loss": 1.9307470321655273, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.4817087650299072, + "train/total_loss": 0.8854576349258423 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.10666859894990921, - "train/contrastive_loss": 2.5006303787231445, - "train/negative_loss": 2.500502824783325, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.0001275109825655818, - "train/total_loss": 0.6067946553230286 + "train/classification_loss": 0.15907734632492065, + "train/contrastive_loss": 1.0022470951080322, + "train/negative_loss": 0.509635329246521, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.49261170625686646, + "train/total_loss": 0.35952675342559814 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.09579037129878998, - "train/contrastive_loss": 1.0907940864562988, - "train/negative_loss": 0.7586641907691956, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.33212992548942566, - "train/total_loss": 0.31394919753074646 + "train/classification_loss": 0.13546057045459747, + "train/contrastive_loss": 2.107813835144043, + "train/negative_loss": 0.5898329019546509, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 1.5179810523986816, + "train/total_loss": 0.5570233464241028 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.10571885108947754, - "train/contrastive_loss": 0.4522063136100769, - "train/negative_loss": 0.35225027799606323, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.09995603561401367, - "train/total_loss": 0.19616010785102844 + "train/classification_loss": 0.15548749268054962, + "train/contrastive_loss": 0.6722891330718994, + "train/negative_loss": 0.2584424316883087, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.4138466715812683, + "train/total_loss": 0.2899453043937683 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.2061019092798233, - "train/contrastive_loss": 2.0403289794921875, - "train/negative_loss": 1.1245170831680298, - "train/num_negatives": 40, + "train/classification_loss": 0.10703416913747787, + "train/contrastive_loss": 1.0288366079330444, + "train/negative_loss": 0.1696818321943283, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.9158117771148682, - "train/total_loss": 0.6141676902770996 + "train/positive_loss": 0.8591547608375549, + "train/total_loss": 0.3128014802932739 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.17753906548023224, - "train/contrastive_loss": 1.597001552581787, - "train/negative_loss": 0.3656781315803528, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 1.2313233613967896, - "train/total_loss": 0.49693936109542847 + "train/classification_loss": 0.16292981803417206, + "train/contrastive_loss": 1.232163906097412, + "train/negative_loss": 0.3997874855995178, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.8323764801025391, + "train/total_loss": 0.4093626141548157 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.19579581916332245, - "train/contrastive_loss": 1.6260998249053955, - "train/negative_loss": 1.4755096435546875, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.150590181350708, - "train/total_loss": 0.5210157632827759 + "train/classification_loss": 0.1506035178899765, + "train/contrastive_loss": 1.4524778127670288, + "train/negative_loss": 1.2619547843933105, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.19052301347255707, + "train/total_loss": 0.4410991072654724 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.1328904926776886, - "train/contrastive_loss": 0.9345663785934448, - "train/negative_loss": 0.32287970185279846, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.611686646938324, - "train/total_loss": 0.31980377435684204 + "train/classification_loss": 0.22428585588932037, + "train/contrastive_loss": 2.6999354362487793, + "train/negative_loss": 1.3738682270050049, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.3260670900344849, + "train/total_loss": 0.764272928237915 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.21059522032737732, - "train/contrastive_loss": 1.4967892169952393, - "train/negative_loss": 0.232171431183815, - "train/num_negatives": 44, + "train/classification_loss": 0.1076676994562149, + "train/contrastive_loss": 1.0153857469558716, + "train/negative_loss": 1.0031427145004272, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.2646178007125854, - "train/total_loss": 0.5099530816078186 + "train/positive_loss": 0.012243022210896015, + "train/total_loss": 0.31074485182762146 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.2338736206293106, - "train/contrastive_loss": 1.7113239765167236, - "train/negative_loss": 0.8836838603019714, - "train/num_negatives": 44, + "train/classification_loss": 0.12680591642856598, + "train/contrastive_loss": 2.765843629837036, + "train/negative_loss": 1.9439961910247803, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 0.827640175819397, - "train/total_loss": 0.576138436794281 + "train/positive_loss": 0.8218474388122559, + "train/total_loss": 0.6799746155738831 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.14494243264198303, - "train/contrastive_loss": 1.6052589416503906, - "train/negative_loss": 0.43248888850212097, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 1.1727700233459473, - "train/total_loss": 0.4659942388534546 + "train/classification_loss": 0.15786993503570557, + "train/contrastive_loss": 2.2721447944641113, + "train/negative_loss": 2.185723304748535, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.08642153441905975, + "train/total_loss": 0.6122989058494568 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.1403319388628006, - "train/contrastive_loss": 1.1659413576126099, - "train/negative_loss": 0.3152478039264679, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.8506935238838196, - "train/total_loss": 0.3735201954841614 + "train/classification_loss": 0.22139698266983032, + "train/contrastive_loss": 2.24672269821167, + "train/negative_loss": 1.6440731287002563, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.602649450302124, + "train/total_loss": 0.6707415580749512 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.10432655364274979, - "train/contrastive_loss": 1.8870713710784912, - "train/negative_loss": 0.6845079064369202, + "train/classification_loss": 0.1993018537759781, + "train/contrastive_loss": 3.190005302429199, + "train/negative_loss": 1.3952195644378662, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 1.2025634050369263, - "train/total_loss": 0.4817408323287964 + "train/num_positives": 10, + "train/positive_loss": 1.7947858572006226, + "train/total_loss": 0.8373029232025146 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.25238141417503357, - "train/contrastive_loss": 1.5280017852783203, - "train/negative_loss": 0.3892383873462677, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.138763427734375, - "train/total_loss": 0.5579817891120911 + "train/classification_loss": 0.23483437299728394, + "train/contrastive_loss": 3.165469169616699, + "train/negative_loss": 2.1562955379486084, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.0091736316680908, + "train/total_loss": 0.8679282069206238 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.25066179037094116, - "train/contrastive_loss": 3.1796464920043945, - "train/negative_loss": 1.3921351432800293, + "train/classification_loss": 0.17677053809165955, + "train/contrastive_loss": 1.9858793020248413, + "train/negative_loss": 1.9858514070510864, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.7875112295150757, - "train/total_loss": 0.8865910768508911 + "train/num_positives": 4, + "train/positive_loss": 2.789558857330121e-05, + "train/total_loss": 0.5739464163780212 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.15064767003059387, - "train/contrastive_loss": 2.637294292449951, - "train/negative_loss": 2.103783369064331, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.5335108637809753, - "train/total_loss": 0.6781065464019775 + "train/classification_loss": 0.17189553380012512, + "train/contrastive_loss": 0.2384476512670517, + "train/negative_loss": 0.22739988565444946, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.011047765612602234, + "train/total_loss": 0.21958506107330322 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.18495012819766998, - "train/contrastive_loss": 1.2911736965179443, - "train/negative_loss": 0.6154749989509583, - "train/num_negatives": 40, + "train/classification_loss": 0.2899576425552368, + "train/contrastive_loss": 2.3789281845092773, + "train/negative_loss": 1.3426588773727417, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.6756987571716309, - "train/total_loss": 0.44318485260009766 - }, - { - "epoch": 12.547528517110266, - "step": 3300, - "train/classification_loss": 0.19752173125743866, - "train/contrastive_loss": 0.6066567897796631, - "train/negative_loss": 0.46394142508506775, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.14271534979343414, - "train/total_loss": 0.31885308027267456 - }, - { - "epoch": 12.547528517110266, - "step": 3300, - "train/classification_loss": 0.11365702003240585, - "train/contrastive_loss": 1.6868340969085693, - "train/negative_loss": 0.7966130971908569, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.8902210593223572, - "train/total_loss": 0.4510238468647003 + "train/positive_loss": 1.036269187927246, + "train/total_loss": 0.7657432556152344 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.2201513648033142, - "train/contrastive_loss": 1.7348096370697021, - "train/negative_loss": 0.7903811931610107, + "train/classification_loss": 0.16905038058757782, + "train/contrastive_loss": 0.5521578788757324, + "train/negative_loss": 0.545505702495575, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.9444284439086914, - "train/total_loss": 0.5671132802963257 + "train/num_positives": 10, + "train/positive_loss": 0.0066522047854959965, + "train/total_loss": 0.2794819474220276 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.2728995978832245, - "train/contrastive_loss": 1.1146036386489868, - "train/negative_loss": 1.114113450050354, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0004901895299553871, - "train/total_loss": 0.4958203434944153 + "train/classification_loss": 0.1666574478149414, + "train/contrastive_loss": 1.482362985610962, + "train/negative_loss": 1.4343078136444092, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.048055149614810944, + "train/total_loss": 0.46313005685806274 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.18309904634952545, - "train/contrastive_loss": 1.358994960784912, - "train/negative_loss": 0.5810627341270447, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.7779321670532227, - "train/total_loss": 0.45489805936813354 + "train/classification_loss": 0.16023311018943787, + "train/contrastive_loss": 2.428905963897705, + "train/negative_loss": 2.0511295795440674, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.37777647376060486, + "train/total_loss": 0.6460143327713013 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.19440911710262299, - "train/contrastive_loss": 3.4399447441101074, - "train/negative_loss": 2.4235405921936035, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.0164040327072144, - "train/total_loss": 0.8823980689048767 + "train/classification_loss": 0.17652864754199982, + "train/contrastive_loss": 0.7080708742141724, + "train/negative_loss": 0.46254757046699524, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 0.24552331864833832, + "train/total_loss": 0.318142831325531 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.18078310787677765, - "train/contrastive_loss": 2.9865708351135254, - "train/negative_loss": 1.5120012760162354, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.47456955909729, - "train/total_loss": 0.7780972719192505 + "train/classification_loss": 0.2224830836057663, + "train/contrastive_loss": 2.6854300498962402, + "train/negative_loss": 1.923003911972046, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.7624260783195496, + "train/total_loss": 0.7595691084861755 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.14805519580841064, - "train/contrastive_loss": 1.3868827819824219, - "train/negative_loss": 0.979536771774292, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.40734606981277466, - "train/total_loss": 0.4254317581653595 + "train/classification_loss": 0.2267010658979416, + "train/contrastive_loss": 1.255798101425171, + "train/negative_loss": 0.6936713457107544, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.5621267557144165, + "train/total_loss": 0.477860689163208 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.1607392430305481, - "train/contrastive_loss": 0.7724603414535522, - "train/negative_loss": 0.7723907232284546, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 6.962064799154177e-05, - "train/total_loss": 0.3152313232421875 + "train/classification_loss": 0.1412009447813034, + "train/contrastive_loss": 2.1248886585235596, + "train/negative_loss": 2.124816656112671, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 7.192782504716888e-05, + "train/total_loss": 0.5661786794662476 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.21451400220394135, - "train/contrastive_loss": 1.9269927740097046, - "train/negative_loss": 1.6983675956726074, + "train/classification_loss": 0.20716820657253265, + "train/contrastive_loss": 1.4115493297576904, + "train/negative_loss": 0.539827287197113, "train/num_negatives": 46, "train/num_positives": 8, - "train/positive_loss": 0.2286251336336136, - "train/total_loss": 0.5999125838279724 + "train/positive_loss": 0.8717220425605774, + "train/total_loss": 0.48947805166244507 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.17594152688980103, - "train/contrastive_loss": 1.9154447317123413, - "train/negative_loss": 1.9083101749420166, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.007134555839002132, - "train/total_loss": 0.5590304732322693 + "train/classification_loss": 0.23758310079574585, + "train/contrastive_loss": 2.8222498893737793, + "train/negative_loss": 2.2336480617523193, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.58860182762146, + "train/total_loss": 0.8020330667495728 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.18166163563728333, - "train/contrastive_loss": 1.0964306592941284, - "train/negative_loss": 1.0218130350112915, + "train/classification_loss": 0.1892024725675583, + "train/contrastive_loss": 0.7085436582565308, + "train/negative_loss": 0.4332088530063629, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.27533477544784546, + "train/total_loss": 0.33091121912002563 + }, + { + "epoch": 11.619718309859154, + "step": 3300, + "train/classification_loss": 0.2605579197406769, + "train/contrastive_loss": 3.3863043785095215, + "train/negative_loss": 1.2728831768035889, + "train/num_negatives": 42, + "train/num_positives": 8, + "train/positive_loss": 2.1134212017059326, + "train/total_loss": 0.9378187656402588 + }, + { + "epoch": 11.619718309859154, + "step": 3300, + "train/classification_loss": 0.13022422790527344, + "train/contrastive_loss": 0.8445090055465698, + "train/negative_loss": 0.6096231937408447, + "train/num_negatives": 46, + "train/num_positives": 10, + "train/positive_loss": 0.23488584160804749, + "train/total_loss": 0.2991260290145874 + }, + { + "epoch": 11.619718309859154, + "step": 3300, + "train/classification_loss": 0.1745436042547226, + "train/contrastive_loss": 2.0638363361358643, + "train/negative_loss": 1.2187228202819824, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 0.8451134562492371, + "train/total_loss": 0.5873108506202698 + }, + { + "epoch": 11.619718309859154, + "step": 3300, + "train/classification_loss": 0.16936448216438293, + "train/contrastive_loss": 0.8729373216629028, + "train/negative_loss": 0.8728799223899841, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 5.740164124290459e-05, + "train/total_loss": 0.343951940536499 + }, + { + "epoch": 11.619718309859154, + "step": 3300, + "train/classification_loss": 0.2582992613315582, + "train/contrastive_loss": 0.9566442966461182, + "train/negative_loss": 0.7929278612136841, "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 0.07461763918399811, - "train/total_loss": 0.4009477496147156 + "train/positive_loss": 0.16371645033359528, + "train/total_loss": 0.4496281147003174 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.19873106479644775, - "train/contrastive_loss": 2.683650016784668, - "train/negative_loss": 1.5991264581680298, - "train/num_negatives": 36, + "train/classification_loss": 0.15283633768558502, + "train/contrastive_loss": 0.5042253136634827, + "train/negative_loss": 0.4478946626186371, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.056330662220716476, + "train/total_loss": 0.25368139147758484 + }, + { + "epoch": 11.619718309859154, + "step": 3300, + "train/classification_loss": 0.3266153931617737, + "train/contrastive_loss": 1.5614755153656006, + "train/negative_loss": 0.4718243479728699, + "train/num_negatives": 30, "train/num_positives": 18, - "train/positive_loss": 1.0845234394073486, - "train/total_loss": 0.7354610562324524 + "train/positive_loss": 1.089651107788086, + "train/total_loss": 0.6389105319976807 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.19481319189071655, - "train/contrastive_loss": 0.696881890296936, - "train/negative_loss": 0.2659606635570526, + "train/classification_loss": 0.13703817129135132, + "train/contrastive_loss": 2.47029185295105, + "train/negative_loss": 0.7654306292533875, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.7048611640930176, + "train/total_loss": 0.6310965418815613 + }, + { + "epoch": 11.619718309859154, + "step": 3300, + "train/classification_loss": 0.19289667904376984, + "train/contrastive_loss": 3.7196288108825684, + "train/negative_loss": 3.216248035430908, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.43092119693756104, - "train/total_loss": 0.33418959379196167 + "train/num_positives": 14, + "train/positive_loss": 0.5033808946609497, + "train/total_loss": 0.9368224143981934 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.1410069465637207, - "train/contrastive_loss": 1.8685730695724487, - "train/negative_loss": 0.8321835994720459, + "train/classification_loss": 0.26242098212242126, + "train/contrastive_loss": 3.1307640075683594, + "train/negative_loss": 3.130762815475464, "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.0363894701004028, - "train/total_loss": 0.5147215723991394 + "train/num_positives": 2, + "train/positive_loss": 1.0728841743912199e-06, + "train/total_loss": 0.8885737657546997 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.13723044097423553, - "train/contrastive_loss": 1.071256160736084, - "train/negative_loss": 0.4372030198574066, + "train/classification_loss": 0.20656751096248627, + "train/contrastive_loss": 2.8097095489501953, + "train/negative_loss": 1.2043330669403076, "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.6340531706809998, - "train/total_loss": 0.35148167610168457 + "train/num_positives": 16, + "train/positive_loss": 1.6053763628005981, + "train/total_loss": 0.7685094475746155 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.2691359221935272, - "train/contrastive_loss": 1.9683219194412231, - "train/negative_loss": 0.6863564252853394, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 1.2819654941558838, - "train/total_loss": 0.6628003120422363 + "train/classification_loss": 0.11084030568599701, + "train/contrastive_loss": 0.1763785183429718, + "train/negative_loss": 0.09339582920074463, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.08298268169164658, + "train/total_loss": 0.14611601829528809 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.1014346107840538, - "train/contrastive_loss": 0.5833827257156372, - "train/negative_loss": 0.5833801627159119, - "train/num_negatives": 48, + "train/classification_loss": 0.19506914913654327, + "train/contrastive_loss": 0.9072536826133728, + "train/negative_loss": 0.8548882603645325, + "train/num_negatives": 40, "train/num_positives": 8, - "train/positive_loss": 2.563003818067955e-06, - "train/total_loss": 0.21811115741729736 + "train/positive_loss": 0.05236539989709854, + "train/total_loss": 0.3765198886394501 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.12606041133403778, - "train/contrastive_loss": 0.7799094915390015, - "train/negative_loss": 0.4002189636230469, + "train/classification_loss": 0.16868776082992554, + "train/contrastive_loss": 1.4061518907546997, + "train/negative_loss": 1.3938604593276978, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.3796905279159546, - "train/total_loss": 0.28204232454299927 + "train/num_positives": 14, + "train/positive_loss": 0.012291480787098408, + "train/total_loss": 0.44991815090179443 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.1033274307847023, - "train/contrastive_loss": 1.219914197921753, - "train/negative_loss": 0.8716353178024292, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.34827885031700134, - "train/total_loss": 0.34731027483940125 + "train/classification_loss": 0.2746620178222656, + "train/contrastive_loss": 2.0092341899871826, + "train/negative_loss": 0.8468360900878906, + "train/num_negatives": 36, + "train/num_positives": 6, + "train/positive_loss": 1.162398099899292, + "train/total_loss": 0.676508903503418 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.16940689086914062, - "train/contrastive_loss": 1.3833918571472168, - "train/negative_loss": 1.2634482383728027, - "train/num_negatives": 28, + "train/classification_loss": 0.13475558161735535, + "train/contrastive_loss": 1.2681504487991333, + "train/negative_loss": 0.4006800353527069, + "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.11994358152151108, - "train/total_loss": 0.44608527421951294 + "train/positive_loss": 0.8674704432487488, + "train/total_loss": 0.38838568329811096 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.13873925805091858, - "train/contrastive_loss": 1.7079704999923706, - "train/negative_loss": 0.618016242980957, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.0899542570114136, - "train/total_loss": 0.4803333580493927 + "train/classification_loss": 0.11036793142557144, + "train/contrastive_loss": 0.643263578414917, + "train/negative_loss": 0.6143208742141724, + "train/num_negatives": 34, + "train/num_positives": 22, + "train/positive_loss": 0.028942694887518883, + "train/total_loss": 0.23902064561843872 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.1556241810321808, - "train/contrastive_loss": 0.28870242834091187, - "train/negative_loss": 0.28336256742477417, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.0053398460149765015, - "train/total_loss": 0.21336466073989868 + "train/classification_loss": 0.14527440071105957, + "train/contrastive_loss": 1.371785283088684, + "train/negative_loss": 0.796165406703949, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 0.5756198763847351, + "train/total_loss": 0.4196314513683319 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.19701683521270752, - "train/contrastive_loss": 2.0400822162628174, - "train/negative_loss": 0.8878315687179565, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.1522506475448608, - "train/total_loss": 0.605033278465271 + "train/classification_loss": 0.19375981390476227, + "train/contrastive_loss": 3.0311942100524902, + "train/negative_loss": 1.077102541923523, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 1.9540917873382568, + "train/total_loss": 0.7999986410140991 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.23069681227207184, - "train/contrastive_loss": 3.3553059101104736, - "train/negative_loss": 2.3089773654937744, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.0463285446166992, - "train/total_loss": 0.9017580151557922 + "train/classification_loss": 0.17526721954345703, + "train/contrastive_loss": 1.0896062850952148, + "train/negative_loss": 0.7854379415512085, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 0.3041682839393616, + "train/total_loss": 0.3931884765625 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.16667497158050537, - "train/contrastive_loss": 1.5509929656982422, - "train/negative_loss": 0.5426768660545349, + "train/classification_loss": 0.09320028126239777, + "train/contrastive_loss": 0.17111603915691376, + "train/negative_loss": 0.1276233047246933, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 1.0083160400390625, - "train/total_loss": 0.47687357664108276 + "train/num_positives": 16, + "train/positive_loss": 0.04349273815751076, + "train/total_loss": 0.127423495054245 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.18547913432121277, - "train/contrastive_loss": 2.9035725593566895, - "train/negative_loss": 1.9228551387786865, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.9807173609733582, - "train/total_loss": 0.7661936283111572 + "train/classification_loss": 0.20182648301124573, + "train/contrastive_loss": 2.5402181148529053, + "train/negative_loss": 1.9559324979782104, + "train/num_negatives": 40, + "train/num_positives": 10, + "train/positive_loss": 0.58428555727005, + "train/total_loss": 0.7098701000213623 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.2673528492450714, - "train/contrastive_loss": 3.9384055137634277, - "train/negative_loss": 1.3883721828460693, + "train/classification_loss": 0.22756846249103546, + "train/contrastive_loss": 1.5960291624069214, + "train/negative_loss": 1.589327335357666, "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 2.5500333309173584, - "train/total_loss": 1.0550339221954346 + "train/num_positives": 2, + "train/positive_loss": 0.006701822858303785, + "train/total_loss": 0.5467743277549744 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.23345428705215454, - "train/contrastive_loss": 3.210688591003418, - "train/negative_loss": 1.7242555618286133, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.4864330291748047, - "train/total_loss": 0.8755919933319092 + "train/classification_loss": 0.158109650015831, + "train/contrastive_loss": 1.5831613540649414, + "train/negative_loss": 0.9915891289710999, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.5915722846984863, + "train/total_loss": 0.47474193572998047 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.18227478861808777, - "train/contrastive_loss": 2.509526014328003, - "train/negative_loss": 1.3292335271835327, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.1802924871444702, - "train/total_loss": 0.6841800212860107 + "train/classification_loss": 0.18724606931209564, + "train/contrastive_loss": 1.3853458166122437, + "train/negative_loss": 1.1623528003692627, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.22299300134181976, + "train/total_loss": 0.4643152356147766 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.21538712084293365, - "train/contrastive_loss": 4.162034034729004, - "train/negative_loss": 1.7455836534500122, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 2.4164505004882812, - "train/total_loss": 1.047793984413147 + "train/classification_loss": 0.15005652606487274, + "train/contrastive_loss": 1.6493808031082153, + "train/negative_loss": 0.41411781311035156, + "train/num_negatives": 44, + "train/num_positives": 8, + "train/positive_loss": 1.2352629899978638, + "train/total_loss": 0.47993266582489014 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.2527192533016205, - "train/contrastive_loss": 4.841754913330078, - "train/negative_loss": 3.3343167304992676, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.507438063621521, - "train/total_loss": 1.2210702896118164 + "train/classification_loss": 0.1380922794342041, + "train/contrastive_loss": 2.0614004135131836, + "train/negative_loss": 2.0613982677459717, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 2.1100088360981317e-06, + "train/total_loss": 0.5503723621368408 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.3059104084968567, - "train/contrastive_loss": 3.919853925704956, - "train/negative_loss": 1.729513168334961, + "train/classification_loss": 0.15814632177352905, + "train/contrastive_loss": 1.2941360473632812, + "train/negative_loss": 0.6059972643852234, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 2.190340757369995, - "train/total_loss": 1.089881181716919 + "train/positive_loss": 0.6881387233734131, + "train/total_loss": 0.4169735312461853 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.1509193480014801, - "train/contrastive_loss": 0.626815915107727, - "train/negative_loss": 0.6266660690307617, + "train/classification_loss": 0.21540136635303497, + "train/contrastive_loss": 2.395094633102417, + "train/negative_loss": 1.565178632736206, "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.00014983859728090465, - "train/total_loss": 0.27628254890441895 + "train/num_positives": 8, + "train/positive_loss": 0.8299160599708557, + "train/total_loss": 0.6944202780723572 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.14138263463974, - "train/contrastive_loss": 0.7746722102165222, - "train/negative_loss": 0.2979638874530792, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.476708322763443, - "train/total_loss": 0.29631710052490234 + "train/classification_loss": 0.14196059107780457, + "train/contrastive_loss": 1.3686342239379883, + "train/negative_loss": 0.527056872844696, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.841577410697937, + "train/total_loss": 0.4156874418258667 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.12290862202644348, - "train/contrastive_loss": 1.0597014427185059, - "train/negative_loss": 0.4957352578639984, - "train/num_negatives": 46, + "train/classification_loss": 0.2523321211338043, + "train/contrastive_loss": 2.1039605140686035, + "train/negative_loss": 1.7423510551452637, + "train/num_negatives": 44, "train/num_positives": 6, - "train/positive_loss": 0.5639661550521851, - "train/total_loss": 0.33484891057014465 + "train/positive_loss": 0.3616095781326294, + "train/total_loss": 0.6731241941452026 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.19829989969730377, - "train/contrastive_loss": 1.6958187818527222, - "train/negative_loss": 1.6958187818527222, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5374636650085449 - }, - { - "epoch": 12.547528517110266, - "eval_exact_match_accuracy": 0.3295238095238095, - "eval_hamming_loss": 0.0642016806722689, - "eval_loss": 0.5512127876281738, - "eval_macro_f1": 0.39931491562175153, - "eval_macro_precision": 0.6104142484947438, - "eval_macro_recall": 0.32805960830548575, - "eval_micro_f1": 0.5990202939118264, - "eval_micro_precision": 0.7781818181818182, - "eval_micro_recall": 0.4869169510807736, - "eval_runtime": 2.6283, - "eval_samples_per_second": 199.746, - "eval_steps_per_second": 25.111, + "train/classification_loss": 0.16454818844795227, + "train/contrastive_loss": 0.9493318200111389, + "train/negative_loss": 0.9492660760879517, + "train/num_negatives": 32, + "train/num_positives": 8, + "train/positive_loss": 6.573570135515183e-05, + "train/total_loss": 0.35441455245018005 + }, + { + "epoch": 11.619718309859154, + "eval_exact_match_accuracy": 0.31922398589065254, + "eval_hamming_loss": 0.06608569353667393, + "eval_loss": 0.5369996428489685, + "eval_macro_f1": 0.4060723084250586, + "eval_macro_precision": 0.6174204117921679, + "eval_macro_recall": 0.33369223478544824, + "eval_micro_f1": 0.5744822979291917, + "eval_micro_precision": 0.7692307692307693, + "eval_micro_recall": 0.4584221748400853, + "eval_runtime": 2.8475, + "eval_samples_per_second": 199.122, + "eval_steps_per_second": 24.934, "step": 3300 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.07876963168382645, - "train/contrastive_loss": 0.1757815033197403, - "train/negative_loss": 0.17422360181808472, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.0015579088358208537, - "train/total_loss": 0.11392593383789062 + "train/classification_loss": 0.1033724844455719, + "train/contrastive_loss": 0.595157265663147, + "train/negative_loss": 0.4263073801994324, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.168849915266037, + "train/total_loss": 0.22240394353866577 }, { - "epoch": 12.547528517110266, + "epoch": 11.619718309859154, "step": 3300, - "train/classification_loss": 0.12117116898298264, - "train/contrastive_loss": 0.33968237042427063, - "train/negative_loss": 0.33965590596199036, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 2.6464829716132954e-05, - "train/total_loss": 0.18910764157772064 + "train/classification_loss": 0.09682909399271011, + "train/contrastive_loss": 0.8690621256828308, + "train/negative_loss": 0.8294048309326172, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.039657287299633026, + "train/total_loss": 0.2706415355205536 }, { - "epoch": 12.737642585551331, - "grad_norm": 6.033344268798828, - "learning_rate": 1.950578386605784e-05, - "loss": 0.5257, + "epoch": 11.795774647887324, + "grad_norm": 4.02087926864624, + "learning_rate": 1.954249471458774e-05, + "loss": 0.5413, "step": 3350 }, { - "epoch": 12.737642585551331, + "epoch": 11.795774647887324, "step": 3350, - "train/classification_loss": 0.12084837257862091, - "train/contrastive_loss": 1.0402737855911255, - "train/negative_loss": 0.7185849547386169, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.32168880105018616, - "train/total_loss": 0.3289031386375427 + "train/classification_loss": 0.16480125486850739, + "train/contrastive_loss": 0.21811242401599884, + "train/negative_loss": 0.2180793583393097, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 3.306148573756218e-05, + "train/total_loss": 0.20842373371124268 }, { - "epoch": 12.737642585551331, + "epoch": 11.795774647887324, "step": 3350, - "train/classification_loss": 0.1350831687450409, - "train/contrastive_loss": 0.47328436374664307, - "train/negative_loss": 0.40987834334373474, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.06340600550174713, - "train/total_loss": 0.22974005341529846 + "train/classification_loss": 0.13820725679397583, + "train/contrastive_loss": 1.0499615669250488, + "train/negative_loss": 0.48286932706832886, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.56709223985672, + "train/total_loss": 0.3481995761394501 }, { - "epoch": 12.927756653992395, - "grad_norm": 6.303250789642334, - "learning_rate": 1.9498173515981736e-05, - "loss": 0.5438, + "epoch": 11.971830985915492, + "grad_norm": 16.348533630371094, + "learning_rate": 1.9535447498238198e-05, + "loss": 0.5809, "step": 3400 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.3234480619430542, - "train/contrastive_loss": 2.627307415008545, - "train/negative_loss": 1.420408010482788, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.2068992853164673, - "train/total_loss": 0.8489095568656921 + "train/classification_loss": 0.2864153981208801, + "train/contrastive_loss": 2.5060911178588867, + "train/negative_loss": 1.3167080879211426, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.1893829107284546, + "train/total_loss": 0.7876336574554443 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.17232373356819153, - "train/contrastive_loss": 2.0110840797424316, - "train/negative_loss": 1.5759251117706299, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.43515902757644653, - "train/total_loss": 0.5745405554771423 + "train/classification_loss": 0.2402697503566742, + "train/contrastive_loss": 1.610914707183838, + "train/negative_loss": 0.41657015681266785, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 1.1943445205688477, + "train/total_loss": 0.5624526739120483 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.18807996809482574, - "train/contrastive_loss": 1.4677977561950684, - "train/negative_loss": 0.22616758942604065, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.24163019657135, - "train/total_loss": 0.4816395044326782 + "train/classification_loss": 0.22807277739048004, + "train/contrastive_loss": 1.9831628799438477, + "train/negative_loss": 1.0569273233413696, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.9262354969978333, + "train/total_loss": 0.6247053742408752 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.24672816693782806, - "train/contrastive_loss": 2.392333745956421, - "train/negative_loss": 1.4311150312423706, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.9612187147140503, - "train/total_loss": 0.7251949310302734 + "train/classification_loss": 0.17550817131996155, + "train/contrastive_loss": 2.4060754776000977, + "train/negative_loss": 1.3238279819488525, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 1.0822473764419556, + "train/total_loss": 0.6567232608795166 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.11139974743127823, - "train/contrastive_loss": 1.7568423748016357, - "train/negative_loss": 1.2235357761383057, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.5333065986633301, - "train/total_loss": 0.46276822686195374 + "train/classification_loss": 0.22617276012897491, + "train/contrastive_loss": 2.8114664554595947, + "train/negative_loss": 2.1197962760925293, + "train/num_negatives": 34, + "train/num_positives": 18, + "train/positive_loss": 0.6916702389717102, + "train/total_loss": 0.7884660363197327 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.15866495668888092, - "train/contrastive_loss": 1.3422092199325562, - "train/negative_loss": 1.2947853803634644, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.047423794865608215, - "train/total_loss": 0.4271067976951599 + "train/classification_loss": 0.22991156578063965, + "train/contrastive_loss": 3.29605770111084, + "train/negative_loss": 1.4074801206588745, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 1.8885774612426758, + "train/total_loss": 0.8891231417655945 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.26168277859687805, - "train/contrastive_loss": 3.1450982093811035, - "train/negative_loss": 1.5229567289352417, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 1.6221415996551514, - "train/total_loss": 0.890702486038208 + "train/classification_loss": 0.18757151067256927, + "train/contrastive_loss": 1.8799256086349487, + "train/negative_loss": 0.8823308944702148, + "train/num_negatives": 36, + "train/num_positives": 14, + "train/positive_loss": 0.9975947141647339, + "train/total_loss": 0.5635566115379333 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.14605562388896942, - "train/contrastive_loss": 1.7078546285629272, - "train/negative_loss": 1.3574588298797607, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.3503958284854889, - "train/total_loss": 0.4876265525817871 + "train/classification_loss": 0.17693592607975006, + "train/contrastive_loss": 0.7002310156822205, + "train/negative_loss": 0.7000147104263306, + "train/num_negatives": 50, + "train/num_positives": 2, + "train/positive_loss": 0.0002163286553695798, + "train/total_loss": 0.3169821500778198 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.14486750960350037, - "train/contrastive_loss": 1.3794909715652466, - "train/negative_loss": 1.1672438383102417, + "train/classification_loss": 0.10390909016132355, + "train/contrastive_loss": 0.9423516988754272, + "train/negative_loss": 0.6986709237098694, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.21224716305732727, - "train/total_loss": 0.4207656979560852 + "train/positive_loss": 0.24368074536323547, + "train/total_loss": 0.2923794388771057 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.310205340385437, - "train/contrastive_loss": 2.6821930408477783, - "train/negative_loss": 1.2606370449066162, + "train/classification_loss": 0.16324786841869354, + "train/contrastive_loss": 2.3501038551330566, + "train/negative_loss": 1.442505121231079, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.421555995941162, - "train/total_loss": 0.8466439843177795 + "train/num_positives": 14, + "train/positive_loss": 0.9075987935066223, + "train/total_loss": 0.6332686543464661 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.1719108670949936, - "train/contrastive_loss": 2.356034755706787, - "train/negative_loss": 1.5501434803009033, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.8058913350105286, - "train/total_loss": 0.6431178450584412 + "train/classification_loss": 0.12983526289463043, + "train/contrastive_loss": 1.7823537588119507, + "train/negative_loss": 0.28791674971580505, + "train/num_negatives": 38, + "train/num_positives": 12, + "train/positive_loss": 1.4944369792938232, + "train/total_loss": 0.48630601167678833 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.11640714854001999, - "train/contrastive_loss": 1.502386212348938, - "train/negative_loss": 0.5223814249038696, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.9800047874450684, - "train/total_loss": 0.4168843924999237 + "train/classification_loss": 0.1586899310350418, + "train/contrastive_loss": 2.7673845291137695, + "train/negative_loss": 1.4687200784683228, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 1.2986645698547363, + "train/total_loss": 0.7121668457984924 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.15294037759304047, - "train/contrastive_loss": 2.535947799682617, - "train/negative_loss": 1.5712870359420776, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.96466064453125, - "train/total_loss": 0.660129964351654 + "train/classification_loss": 0.1976153403520584, + "train/contrastive_loss": 2.9747040271759033, + "train/negative_loss": 1.6252983808517456, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.3494056463241577, + "train/total_loss": 0.7925561666488647 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.10188791900873184, - "train/contrastive_loss": 1.9406116008758545, - "train/negative_loss": 1.9405585527420044, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 5.306052480591461e-05, - "train/total_loss": 0.49001023173332214 + "train/classification_loss": 0.15510419011116028, + "train/contrastive_loss": 1.403907060623169, + "train/negative_loss": 0.6084649562835693, + "train/num_negatives": 46, + "train/num_positives": 4, + "train/positive_loss": 0.7954421043395996, + "train/total_loss": 0.43588560819625854 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.09336108714342117, - "train/contrastive_loss": 0.9571070075035095, - "train/negative_loss": 0.8648159503936768, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.09229103475809097, - "train/total_loss": 0.2847824990749359 + "train/classification_loss": 0.14470325410366058, + "train/contrastive_loss": 2.6630091667175293, + "train/negative_loss": 0.42742475867271423, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 2.2355844974517822, + "train/total_loss": 0.6773051023483276 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.10377389192581177, - "train/contrastive_loss": 0.6027169823646545, - "train/negative_loss": 0.4369102418422699, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.16580672562122345, - "train/total_loss": 0.2243172824382782 + "train/classification_loss": 0.161673441529274, + "train/contrastive_loss": 1.0393285751342773, + "train/negative_loss": 0.5355088710784912, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.5038197040557861, + "train/total_loss": 0.36953914165496826 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.22170943021774292, - "train/contrastive_loss": 2.718154191970825, - "train/negative_loss": 1.3643230199813843, - "train/num_negatives": 40, + "train/classification_loss": 0.10991991311311722, + "train/contrastive_loss": 1.0561574697494507, + "train/negative_loss": 0.1740603744983673, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 1.353831171989441, - "train/total_loss": 0.765340268611908 + "train/positive_loss": 0.882097065448761, + "train/total_loss": 0.32115140557289124 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.165597066283226, - "train/contrastive_loss": 1.01565420627594, - "train/negative_loss": 0.13276854157447815, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.8828856348991394, - "train/total_loss": 0.3687279224395752 + "train/classification_loss": 0.17279328405857086, + "train/contrastive_loss": 1.3032574653625488, + "train/negative_loss": 0.4021962881088257, + "train/num_negatives": 26, + "train/num_positives": 20, + "train/positive_loss": 0.9010611772537231, + "train/total_loss": 0.4334447979927063 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.2028965950012207, - "train/contrastive_loss": 1.2772231101989746, - "train/negative_loss": 1.0927908420562744, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.18443232774734497, - "train/total_loss": 0.45834121108055115 + "train/classification_loss": 0.15077152848243713, + "train/contrastive_loss": 1.6674673557281494, + "train/negative_loss": 0.7585099935531616, + "train/num_negatives": 42, + "train/num_positives": 10, + "train/positive_loss": 0.9089574217796326, + "train/total_loss": 0.484264999628067 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.1424788385629654, - "train/contrastive_loss": 0.9390831589698792, - "train/negative_loss": 0.4723949134349823, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.46668824553489685, - "train/total_loss": 0.33029547333717346 + "train/classification_loss": 0.21579018235206604, + "train/contrastive_loss": 3.4853367805480957, + "train/negative_loss": 1.4509748220443726, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 2.0343618392944336, + "train/total_loss": 0.9128575325012207 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.23015719652175903, - "train/contrastive_loss": 1.9399150609970093, - "train/negative_loss": 0.28329575061798096, - "train/num_negatives": 44, + "train/classification_loss": 0.11221495270729065, + "train/contrastive_loss": 1.077101230621338, + "train/negative_loss": 1.0760865211486816, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.6566193103790283, - "train/total_loss": 0.6181402206420898 + "train/positive_loss": 0.0010147526627406478, + "train/total_loss": 0.3276351988315582 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.2635957896709442, - "train/contrastive_loss": 2.685075283050537, - "train/negative_loss": 1.3108776807785034, - "train/num_negatives": 44, + "train/classification_loss": 0.12250817567110062, + "train/contrastive_loss": 2.709306478500366, + "train/negative_loss": 1.8837618827819824, + "train/num_negatives": 48, "train/num_positives": 8, - "train/positive_loss": 1.3741976022720337, - "train/total_loss": 0.8006108999252319 + "train/positive_loss": 0.8255445957183838, + "train/total_loss": 0.6643694639205933 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.1518651694059372, - "train/contrastive_loss": 1.8658971786499023, - "train/negative_loss": 0.4518791437149048, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 1.4140180349349976, - "train/total_loss": 0.5250446200370789 + "train/classification_loss": 0.16665510833263397, + "train/contrastive_loss": 2.5002269744873047, + "train/negative_loss": 2.378385066986084, + "train/num_negatives": 46, + "train/num_positives": 6, + "train/positive_loss": 0.1218419224023819, + "train/total_loss": 0.666700541973114 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.15426579117774963, - "train/contrastive_loss": 1.3650071620941162, - "train/negative_loss": 0.3637980818748474, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 1.001209020614624, - "train/total_loss": 0.4272672235965729 + "train/classification_loss": 0.23845462501049042, + "train/contrastive_loss": 2.1372268199920654, + "train/negative_loss": 1.0707604885101318, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.0664663314819336, + "train/total_loss": 0.6658999919891357 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.0983562171459198, - "train/contrastive_loss": 1.508538842201233, - "train/negative_loss": 0.6112044453620911, + "train/classification_loss": 0.18439550697803497, + "train/contrastive_loss": 3.084998607635498, + "train/negative_loss": 1.116882562637329, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.8973343968391418, - "train/total_loss": 0.40006399154663086 + "train/num_positives": 10, + "train/positive_loss": 1.9681161642074585, + "train/total_loss": 0.8013952374458313 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.26821720600128174, - "train/contrastive_loss": 1.8827800750732422, - "train/negative_loss": 0.3559780418872833, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.5268020629882812, - "train/total_loss": 0.6447732448577881 + "train/classification_loss": 0.22670240700244904, + "train/contrastive_loss": 2.1536686420440674, + "train/negative_loss": 1.2204763889312744, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.9331921935081482, + "train/total_loss": 0.6574361324310303 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.2543896436691284, - "train/contrastive_loss": 2.8133068084716797, - "train/negative_loss": 1.4167543649673462, + "train/classification_loss": 0.1767055243253708, + "train/contrastive_loss": 1.5982882976531982, + "train/negative_loss": 1.594626545906067, "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.3965524435043335, - "train/total_loss": 0.8170509934425354 + "train/num_positives": 4, + "train/positive_loss": 0.0036618048325181007, + "train/total_loss": 0.49636316299438477 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.16225335001945496, - "train/contrastive_loss": 3.4465959072113037, - "train/negative_loss": 2.726245403289795, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.7203505039215088, - "train/total_loss": 0.8515725135803223 + "train/classification_loss": 0.1886516511440277, + "train/contrastive_loss": 0.33055827021598816, + "train/negative_loss": 0.24170003831386566, + "train/num_negatives": 32, + "train/num_positives": 20, + "train/positive_loss": 0.0888582244515419, + "train/total_loss": 0.25476330518722534 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.19062389433383942, - "train/contrastive_loss": 1.785198450088501, - "train/negative_loss": 0.7517717480659485, - "train/num_negatives": 40, + "train/classification_loss": 0.2767840027809143, + "train/contrastive_loss": 2.9796955585479736, + "train/negative_loss": 1.500819206237793, + "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 1.0334266424179077, - "train/total_loss": 0.5476635694503784 - }, - { - "epoch": 12.927756653992395, - "step": 3400, - "train/classification_loss": 0.2105678915977478, - "train/contrastive_loss": 0.7853504419326782, - "train/negative_loss": 0.5124862194061279, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.2728641927242279, - "train/total_loss": 0.3676379919052124 - }, - { - "epoch": 12.927756653992395, - "step": 3400, - "train/classification_loss": 0.10351688414812088, - "train/contrastive_loss": 1.407652735710144, - "train/negative_loss": 0.6761858463287354, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.7314668893814087, - "train/total_loss": 0.38504743576049805 + "train/positive_loss": 1.4788763523101807, + "train/total_loss": 0.8727231025695801 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.20471887290477753, - "train/contrastive_loss": 1.7054637670516968, - "train/negative_loss": 0.9719778299331665, + "train/classification_loss": 0.1781867891550064, + "train/contrastive_loss": 0.8134265542030334, + "train/negative_loss": 0.7134259939193726, "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.7334859371185303, - "train/total_loss": 0.545811653137207 - }, - { - "epoch": 12.927756653992395, - "step": 3400, - "train/classification_loss": 0.2880289554595947, - "train/contrastive_loss": 1.0999417304992676, - "train/negative_loss": 1.099518895149231, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0004228651523590088, - "train/total_loss": 0.5080173015594482 + "train/num_positives": 10, + "train/positive_loss": 0.1000005379319191, + "train/total_loss": 0.3408721089363098 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.18976879119873047, - "train/contrastive_loss": 0.9071958065032959, - "train/negative_loss": 0.4946019649505615, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.412593811750412, - "train/total_loss": 0.37120795249938965 + "train/classification_loss": 0.15018221735954285, + "train/contrastive_loss": 0.8663634657859802, + "train/negative_loss": 0.7129050493240356, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 0.1534584015607834, + "train/total_loss": 0.32345491647720337 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.18267199397087097, - "train/contrastive_loss": 2.568951368331909, - "train/negative_loss": 1.862320065498352, + "train/classification_loss": 0.14743544161319733, + "train/contrastive_loss": 2.3652307987213135, + "train/negative_loss": 1.2357358932495117, "train/num_negatives": 52, "train/num_positives": 4, - "train/positive_loss": 0.7066313028335571, - "train/total_loss": 0.6964622735977173 + "train/positive_loss": 1.1294949054718018, + "train/total_loss": 0.6204816102981567 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.17431189119815826, - "train/contrastive_loss": 2.8592896461486816, - "train/negative_loss": 1.3268438577651978, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.5324457883834839, - "train/total_loss": 0.7461698055267334 + "train/classification_loss": 0.1907016783952713, + "train/contrastive_loss": 2.2304954528808594, + "train/negative_loss": 1.0534167289733887, + "train/num_negatives": 42, + "train/num_positives": 12, + "train/positive_loss": 1.1770786046981812, + "train/total_loss": 0.6368007659912109 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.1356964409351349, - "train/contrastive_loss": 1.7638190984725952, - "train/negative_loss": 1.1583133935928345, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.6055057048797607, - "train/total_loss": 0.4884602725505829 + "train/classification_loss": 0.22363734245300293, + "train/contrastive_loss": 2.555762767791748, + "train/negative_loss": 1.7651923894882202, + "train/num_negatives": 48, + "train/num_positives": 6, + "train/positive_loss": 0.7905704379081726, + "train/total_loss": 0.7347899079322815 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.17916330695152283, - "train/contrastive_loss": 1.5442063808441162, - "train/negative_loss": 1.0730016231536865, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.4712047576904297, - "train/total_loss": 0.488004595041275 + "train/classification_loss": 0.21107934415340424, + "train/contrastive_loss": 1.508976697921753, + "train/negative_loss": 0.9622426629066467, + "train/num_negatives": 44, + "train/num_positives": 6, + "train/positive_loss": 0.546734094619751, + "train/total_loss": 0.5128746628761292 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.188121497631073, - "train/contrastive_loss": 1.7028404474258423, - "train/negative_loss": 1.5757310390472412, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.1271093785762787, - "train/total_loss": 0.5286896228790283 + "train/classification_loss": 0.1506933569908142, + "train/contrastive_loss": 2.156078815460205, + "train/negative_loss": 2.156059503555298, + "train/num_negatives": 42, + "train/num_positives": 14, + "train/positive_loss": 1.9261493434896693e-05, + "train/total_loss": 0.5819091200828552 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.16467157006263733, - "train/contrastive_loss": 1.8552337884902954, - "train/negative_loss": 1.8384615182876587, + "train/classification_loss": 0.19637171924114227, + "train/contrastive_loss": 1.519548773765564, + "train/negative_loss": 0.29067566990852356, "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.016772309318184853, - "train/total_loss": 0.5357183218002319 + "train/num_positives": 8, + "train/positive_loss": 1.2288731336593628, + "train/total_loss": 0.5002814531326294 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.19487059116363525, - "train/contrastive_loss": 1.1774718761444092, - "train/negative_loss": 0.9769262671470642, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.20054565370082855, - "train/total_loss": 0.4303649663925171 + "train/classification_loss": 0.24347355961799622, + "train/contrastive_loss": 2.788450002670288, + "train/negative_loss": 2.3680341243743896, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.42041581869125366, + "train/total_loss": 0.8011635541915894 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.20121337473392487, - "train/contrastive_loss": 2.5096473693847656, - "train/negative_loss": 1.4260035753250122, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 1.0836437940597534, - "train/total_loss": 0.7031428217887878 + "train/classification_loss": 0.20849721133708954, + "train/contrastive_loss": 0.7086260318756104, + "train/negative_loss": 0.34195905923843384, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 0.3666669428348541, + "train/total_loss": 0.3502224087715149 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.20596937835216522, - "train/contrastive_loss": 1.8080418109893799, - "train/negative_loss": 0.37470105290412903, + "train/classification_loss": 0.28504258394241333, + "train/contrastive_loss": 3.280843734741211, + "train/negative_loss": 1.3918296098709106, "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 1.4333407878875732, - "train/total_loss": 0.5675777196884155 + "train/num_positives": 8, + "train/positive_loss": 1.8890140056610107, + "train/total_loss": 0.9412113428115845 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.1521429419517517, - "train/contrastive_loss": 2.042966842651367, - "train/negative_loss": 0.7615265846252441, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.281440258026123, - "train/total_loss": 0.5607362985610962 + "train/classification_loss": 0.12758541107177734, + "train/contrastive_loss": 0.9434974193572998, + "train/negative_loss": 0.6942369341850281, + "train/num_negatives": 46, + "train/num_positives": 10, + "train/positive_loss": 0.24926047027111053, + "train/total_loss": 0.3162848949432373 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.1632707267999649, - "train/contrastive_loss": 1.485603928565979, - "train/negative_loss": 0.6564373970031738, - "train/num_negatives": 40, + "train/classification_loss": 0.18063253164291382, + "train/contrastive_loss": 2.559826374053955, + "train/negative_loss": 1.1091228723526, + "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 0.8291665315628052, - "train/total_loss": 0.4603915214538574 + "train/positive_loss": 1.450703501701355, + "train/total_loss": 0.6925978064537048 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.25703391432762146, - "train/contrastive_loss": 1.640439748764038, - "train/negative_loss": 0.6920076608657837, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.9484320878982544, - "train/total_loss": 0.5851218700408936 + "train/classification_loss": 0.14654940366744995, + "train/contrastive_loss": 0.37958288192749023, + "train/negative_loss": 0.3795297145843506, + "train/num_negatives": 50, + "train/num_positives": 4, + "train/positive_loss": 5.3169023885857314e-05, + "train/total_loss": 0.22246599197387695 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.10168159753084183, - "train/contrastive_loss": 0.8801308870315552, - "train/negative_loss": 0.8799821138381958, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.00014878045476507396, - "train/total_loss": 0.2777077853679657 + "train/classification_loss": 0.2653622329235077, + "train/contrastive_loss": 0.40057963132858276, + "train/negative_loss": 0.3929031789302826, + "train/num_negatives": 50, + "train/num_positives": 6, + "train/positive_loss": 0.0076764412224292755, + "train/total_loss": 0.3454781770706177 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.12447533756494522, - "train/contrastive_loss": 1.0265800952911377, - "train/negative_loss": 0.2073023021221161, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.8192777633666992, - "train/total_loss": 0.3297913670539856 + "train/classification_loss": 0.15090252459049225, + "train/contrastive_loss": 0.6711095571517944, + "train/negative_loss": 0.5360282063484192, + "train/num_negatives": 40, + "train/num_positives": 12, + "train/positive_loss": 0.13508135080337524, + "train/total_loss": 0.28512442111968994 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.10704585164785385, - "train/contrastive_loss": 1.3684585094451904, - "train/negative_loss": 0.9173287749290466, + "train/classification_loss": 0.3246062099933624, + "train/contrastive_loss": 2.254579782485962, + "train/negative_loss": 1.4058345556259155, "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.451129674911499, - "train/total_loss": 0.3807375729084015 + "train/num_positives": 18, + "train/positive_loss": 0.8487451672554016, + "train/total_loss": 0.7755221724510193 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.17465703189373016, - "train/contrastive_loss": 1.6902122497558594, - "train/negative_loss": 1.148132085800171, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.5420802235603333, - "train/total_loss": 0.5126994848251343 + "train/classification_loss": 0.1271226704120636, + "train/contrastive_loss": 2.638763427734375, + "train/negative_loss": 0.6320816874504089, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 2.0066816806793213, + "train/total_loss": 0.6548753976821899 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.1370653510093689, - "train/contrastive_loss": 1.9338325262069702, - "train/negative_loss": 0.6473388671875, + "train/classification_loss": 0.18041278421878815, + "train/contrastive_loss": 2.6744189262390137, + "train/negative_loss": 2.264373302459717, "train/num_negatives": 42, "train/num_positives": 14, - "train/positive_loss": 1.2864936590194702, - "train/total_loss": 0.523831844329834 + "train/positive_loss": 0.4100455641746521, + "train/total_loss": 0.7152965664863586 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.16121484339237213, - "train/contrastive_loss": 0.44096219539642334, - "train/negative_loss": 0.4105415940284729, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.03042059764266014, - "train/total_loss": 0.24940729141235352 + "train/classification_loss": 0.300018310546875, + "train/contrastive_loss": 2.5565543174743652, + "train/negative_loss": 2.5565528869628906, + "train/num_negatives": 48, + "train/num_positives": 2, + "train/positive_loss": 1.3113030945532955e-06, + "train/total_loss": 0.811329185962677 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.2159525752067566, - "train/contrastive_loss": 2.183407783508301, - "train/negative_loss": 1.07178795337677, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.1116197109222412, - "train/total_loss": 0.6526341438293457 + "train/classification_loss": 0.2101355493068695, + "train/contrastive_loss": 3.068310260772705, + "train/negative_loss": 1.3865567445755005, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 1.681753396987915, + "train/total_loss": 0.8237975835800171 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.21477432548999786, - "train/contrastive_loss": 1.6629621982574463, - "train/negative_loss": 0.9431710839271545, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.7197911143302917, - "train/total_loss": 0.5473667979240417 + "train/classification_loss": 0.12214487046003342, + "train/contrastive_loss": 0.7940738797187805, + "train/negative_loss": 0.2134452909231186, + "train/num_negatives": 36, + "train/num_positives": 12, + "train/positive_loss": 0.5806285738945007, + "train/total_loss": 0.2809596359729767 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.21116185188293457, - "train/contrastive_loss": 1.9255558252334595, - "train/negative_loss": 0.41026756167411804, + "train/classification_loss": 0.21674410998821259, + "train/contrastive_loss": 0.9268835186958313, + "train/negative_loss": 0.6917107701301575, "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 1.515288233757019, - "train/total_loss": 0.5962730646133423 + "train/num_positives": 8, + "train/positive_loss": 0.23517273366451263, + "train/total_loss": 0.40212082862854004 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.18556249141693115, - "train/contrastive_loss": 3.155332565307617, - "train/negative_loss": 1.8614416122436523, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.2938908338546753, - "train/total_loss": 0.8166289925575256 + "train/classification_loss": 0.17498879134655, + "train/contrastive_loss": 1.4075732231140137, + "train/negative_loss": 1.0333727598190308, + "train/num_negatives": 38, + "train/num_positives": 14, + "train/positive_loss": 0.37420040369033813, + "train/total_loss": 0.4565034508705139 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.2694458067417145, - "train/contrastive_loss": 4.2376604080200195, - "train/negative_loss": 1.5531132221221924, - "train/num_negatives": 46, + "train/classification_loss": 0.32710063457489014, + "train/contrastive_loss": 3.023778200149536, + "train/negative_loss": 0.9421355128288269, + "train/num_negatives": 36, "train/num_positives": 6, - "train/positive_loss": 2.684546947479248, - "train/total_loss": 1.1169779300689697 + "train/positive_loss": 2.0816426277160645, + "train/total_loss": 0.9318562746047974 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.23633797466754913, - "train/contrastive_loss": 3.0634407997131348, - "train/negative_loss": 1.719818115234375, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.3436225652694702, - "train/total_loss": 0.8490261435508728 + "train/classification_loss": 0.13638830184936523, + "train/contrastive_loss": 0.8297756910324097, + "train/negative_loss": 0.26942458748817444, + "train/num_negatives": 44, + "train/num_positives": 12, + "train/positive_loss": 0.5603510737419128, + "train/total_loss": 0.3023434281349182 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.1702396273612976, - "train/contrastive_loss": 1.6408214569091797, - "train/negative_loss": 0.6896739602088928, + "train/classification_loss": 0.12461970746517181, + "train/contrastive_loss": 0.5863827466964722, + "train/negative_loss": 0.35135072469711304, "train/num_negatives": 34, "train/num_positives": 22, - "train/positive_loss": 0.9511475563049316, - "train/total_loss": 0.498403936624527 - }, - { - "epoch": 12.927756653992395, - "step": 3400, - "train/classification_loss": 0.198253333568573, - "train/contrastive_loss": 4.252507209777832, - "train/negative_loss": 1.6889605522155762, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 2.563546895980835, - "train/total_loss": 1.0487548112869263 + "train/positive_loss": 0.23503205180168152, + "train/total_loss": 0.24189625680446625 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.2711775600910187, - "train/contrastive_loss": 4.345482349395752, - "train/negative_loss": 2.6670138835906982, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.6784684658050537, - "train/total_loss": 1.1402740478515625 + "train/classification_loss": 0.1512128710746765, + "train/contrastive_loss": 2.0193936824798584, + "train/negative_loss": 0.9081525206565857, + "train/num_negatives": 52, + "train/num_positives": 4, + "train/positive_loss": 1.111241102218628, + "train/total_loss": 0.5550916194915771 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.2955111265182495, - "train/contrastive_loss": 3.2295145988464355, - "train/negative_loss": 1.6806541681289673, + "train/classification_loss": 0.20463521778583527, + "train/contrastive_loss": 2.241032123565674, + "train/negative_loss": 1.4335198402404785, "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.5488604307174683, - "train/total_loss": 0.9414140582084656 - }, - { - "epoch": 12.927756653992395, - "step": 3400, - "train/classification_loss": 0.15682178735733032, - "train/contrastive_loss": 0.7344776391983032, - "train/negative_loss": 0.7328202128410339, - "train/num_negatives": 48, "train/num_positives": 4, - "train/positive_loss": 0.00165742717217654, - "train/total_loss": 0.30371731519699097 + "train/positive_loss": 0.8075124025344849, + "train/total_loss": 0.6528416275978088 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.1472228318452835, - "train/contrastive_loss": 0.9769076108932495, - "train/negative_loss": 0.19700390100479126, + "train/classification_loss": 0.19932608306407928, + "train/contrastive_loss": 1.1772005558013916, + "train/negative_loss": 0.46148422360420227, "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.7799037098884583, - "train/total_loss": 0.3426043391227722 - }, - { - "epoch": 12.927756653992395, - "step": 3400, - "train/classification_loss": 0.11231127381324768, - "train/contrastive_loss": 1.0902435779571533, - "train/negative_loss": 0.25961020588874817, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.8306333422660828, - "train/total_loss": 0.3303599953651428 - }, - { - "epoch": 12.927756653992395, - "step": 3400, - "train/classification_loss": 0.2001384049654007, - "train/contrastive_loss": 1.6484830379486084, - "train/negative_loss": 1.6484830379486084, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.529835045337677 - }, - { - "epoch": 12.927756653992395, - "eval_exact_match_accuracy": 0.3142857142857143, - "eval_hamming_loss": 0.06532212885154062, - "eval_loss": 0.5668320655822754, - "eval_macro_f1": 0.3991935987374441, - "eval_macro_precision": 0.6077078713174527, - "eval_macro_recall": 0.3220673542155757, - "eval_micro_f1": 0.583868665239115, - "eval_micro_precision": 0.7835249042145593, - "eval_micro_recall": 0.4653014789533561, - "eval_runtime": 2.6317, - "eval_samples_per_second": 199.493, - "eval_steps_per_second": 25.079, - "step": 3400 + "train/num_positives": 12, + "train/positive_loss": 0.7157163619995117, + "train/total_loss": 0.4347662031650543 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.049722738564014435, - "train/contrastive_loss": 0.2603868842124939, - "train/negative_loss": 0.12564344704151154, - "train/num_negatives": 36, - "train/num_positives": 20, - "train/positive_loss": 0.13474345207214355, - "train/total_loss": 0.1018001139163971 + "train/classification_loss": 0.07740391045808792, + "train/contrastive_loss": 0.21475635468959808, + "train/negative_loss": 0.18394051492214203, + "train/num_negatives": 40, + "train/num_positives": 16, + "train/positive_loss": 0.030815843492746353, + "train/total_loss": 0.12035518139600754 }, { - "epoch": 12.927756653992395, + "epoch": 11.971830985915492, "step": 3400, - "train/classification_loss": 0.0589284747838974, - "train/contrastive_loss": 0.2904653251171112, - "train/negative_loss": 0.2898704409599304, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.0005948820617049932, - "train/total_loss": 0.11702154576778412 - }, - { - "epoch": 13.11787072243346, - "grad_norm": 7.749636173248291, - "learning_rate": 1.9490563165905634e-05, - "loss": 0.4982, - "step": 3450 - }, - { - "epoch": 13.11787072243346, - "step": 3450, - "train/classification_loss": 0.13003812730312347, - "train/contrastive_loss": 2.1832239627838135, - "train/negative_loss": 1.4360803365707397, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.747143566608429, - "train/total_loss": 0.5666829347610474 - }, - { - "epoch": 13.11787072243346, - "step": 3450, - "train/classification_loss": 0.12459120899438858, - "train/contrastive_loss": 0.6128494143486023, - "train/negative_loss": 0.44227415323257446, - "train/num_negatives": 46, + "train/classification_loss": 0.20169365406036377, + "train/contrastive_loss": 2.285486936569214, + "train/negative_loss": 1.5728172063827515, + "train/num_negatives": 40, "train/num_positives": 10, - "train/positive_loss": 0.17057524621486664, - "train/total_loss": 0.24716109037399292 - }, - { - "epoch": 13.307984790874524, - "grad_norm": 3.7602009773254395, - "learning_rate": 1.948295281582953e-05, - "loss": 0.513, - "step": 3500 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.3131314516067505, - "train/contrastive_loss": 2.204012155532837, - "train/negative_loss": 0.6376218795776367, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.5663902759552002, - "train/total_loss": 0.7539339065551758 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.1535107046365738, - "train/contrastive_loss": 1.759305715560913, - "train/negative_loss": 1.1754164695739746, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.5838891863822937, - "train/total_loss": 0.5053718686103821 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.18301917612552643, - "train/contrastive_loss": 2.090938091278076, - "train/negative_loss": 0.8717172145843506, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.2192209959030151, - "train/total_loss": 0.6012067794799805 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.2281382530927658, - "train/contrastive_loss": 3.5178351402282715, - "train/negative_loss": 2.0448684692382812, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.4729667901992798, - "train/total_loss": 0.9317052960395813 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.09628544747829437, - "train/contrastive_loss": 1.4005948305130005, - "train/negative_loss": 1.001780390739441, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.39881446957588196, - "train/total_loss": 0.37640440464019775 + "train/positive_loss": 0.7126697897911072, + "train/total_loss": 0.6587910652160645 }, { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.15823350846767426, - "train/contrastive_loss": 1.4336771965026855, - "train/negative_loss": 1.1870166063308716, + "epoch": 11.971830985915492, + "step": 3400, + "train/classification_loss": 0.20289531350135803, + "train/contrastive_loss": 1.0738251209259033, + "train/negative_loss": 1.0522583723068237, "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.2466605305671692, - "train/total_loss": 0.44496893882751465 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.2304578572511673, - "train/contrastive_loss": 2.8146204948425293, - "train/negative_loss": 1.158129096031189, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 1.6564912796020508, - "train/total_loss": 0.793381929397583 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.1451205462217331, - "train/contrastive_loss": 1.855086088180542, - "train/negative_loss": 0.9408150911331177, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.9142710566520691, - "train/total_loss": 0.5161377787590027 + "train/num_positives": 2, + "train/positive_loss": 0.021566739305853844, + "train/total_loss": 0.41766035556793213 }, { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.12891337275505066, - "train/contrastive_loss": 0.9516881108283997, - "train/negative_loss": 0.9352684020996094, + "epoch": 11.971830985915492, + "step": 3400, + "train/classification_loss": 0.16088584065437317, + "train/contrastive_loss": 2.5070641040802, + "train/negative_loss": 1.0180082321166992, "train/num_negatives": 44, "train/num_positives": 12, - "train/positive_loss": 0.01641969382762909, - "train/total_loss": 0.31925100088119507 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.2704474627971649, - "train/contrastive_loss": 2.361619472503662, - "train/negative_loss": 1.2551683187484741, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.1064510345458984, - "train/total_loss": 0.7427713871002197 + "train/positive_loss": 1.489055871963501, + "train/total_loss": 0.6622986793518066 }, { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.1654253900051117, - "train/contrastive_loss": 2.4619863033294678, - "train/negative_loss": 1.5235306024551392, + "epoch": 11.971830985915492, + "step": 3400, + "train/classification_loss": 0.18439029157161713, + "train/contrastive_loss": 1.3094674348831177, + "train/negative_loss": 0.7377079129219055, "train/num_negatives": 40, "train/num_positives": 16, - "train/positive_loss": 0.9384557604789734, - "train/total_loss": 0.6578226685523987 + "train/positive_loss": 0.5717595219612122, + "train/total_loss": 0.446283757686615 }, { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.09823053330183029, - "train/contrastive_loss": 0.9201090335845947, - "train/negative_loss": 0.35931649804115295, + "epoch": 11.971830985915492, + "step": 3400, + "train/classification_loss": 0.171571284532547, + "train/contrastive_loss": 2.0250818729400635, + "train/negative_loss": 0.44625118374824524, "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.5607925653457642, - "train/total_loss": 0.28225234150886536 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.14059631526470184, - "train/contrastive_loss": 1.8943357467651367, - "train/negative_loss": 1.67543363571167, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.21890217065811157, - "train/total_loss": 0.5194634795188904 + "train/num_positives": 8, + "train/positive_loss": 1.578830599784851, + "train/total_loss": 0.5765876770019531 }, { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.10235808789730072, - "train/contrastive_loss": 2.4080779552459717, - "train/negative_loss": 2.407440662384033, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.0006373624783009291, - "train/total_loss": 0.5839737057685852 + "epoch": 11.971830985915492, + "step": 3400, + "train/classification_loss": 0.12282082438468933, + "train/contrastive_loss": 0.7972508072853088, + "train/negative_loss": 0.7972486615180969, + "train/num_negatives": 34, + "train/num_positives": 20, + "train/positive_loss": 2.1338505575840827e-06, + "train/total_loss": 0.28227096796035767 }, { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.09681634604930878, - "train/contrastive_loss": 1.1973892450332642, - "train/negative_loss": 1.1230719089508057, + "epoch": 11.971830985915492, + "step": 3400, + "train/classification_loss": 0.16165323555469513, + "train/contrastive_loss": 1.1839613914489746, + "train/negative_loss": 0.4316282272338867, "train/num_negatives": 46, "train/num_positives": 10, - "train/positive_loss": 0.0743173137307167, - "train/total_loss": 0.3362942039966583 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.1098785549402237, - "train/contrastive_loss": 0.5822588205337524, - "train/negative_loss": 0.29130819439888, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.29095062613487244, - "train/total_loss": 0.22633031010627747 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.2172199934720993, - "train/contrastive_loss": 2.7216129302978516, - "train/negative_loss": 1.303812861442566, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.4178001880645752, - "train/total_loss": 0.7615426182746887 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.15756334364414215, - "train/contrastive_loss": 1.2826542854309082, - "train/negative_loss": 0.4519054889678955, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.8307488560676575, - "train/total_loss": 0.4140942096710205 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.19557613134384155, - "train/contrastive_loss": 1.2099467515945435, - "train/negative_loss": 1.0798031091690063, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.1301436871290207, - "train/total_loss": 0.43756550550460815 + "train/positive_loss": 0.7523331046104431, + "train/total_loss": 0.3984455168247223 }, { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.14083486795425415, - "train/contrastive_loss": 1.401590347290039, - "train/negative_loss": 0.3321691155433655, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.0694212913513184, - "train/total_loss": 0.4211529493331909 + "epoch": 11.971830985915492, + "step": 3400, + "train/classification_loss": 0.20239406824111938, + "train/contrastive_loss": 2.348005533218384, + "train/negative_loss": 1.31099534034729, + "train/num_negatives": 48, + "train/num_positives": 8, + "train/positive_loss": 1.0370101928710938, + "train/total_loss": 0.6719951629638672 }, { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.24091802537441254, - "train/contrastive_loss": 1.543561339378357, - "train/negative_loss": 0.16771619021892548, + "epoch": 11.971830985915492, + "step": 3400, + "train/classification_loss": 0.16138069331645966, + "train/contrastive_loss": 2.599496841430664, + "train/negative_loss": 1.0955849885940552, "train/num_negatives": 44, - "train/num_positives": 10, - "train/positive_loss": 1.375845193862915, - "train/total_loss": 0.5496302843093872 + "train/num_positives": 12, + "train/positive_loss": 1.5039119720458984, + "train/total_loss": 0.6812800765037537 }, { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.24372498691082, - "train/contrastive_loss": 2.069575309753418, - "train/negative_loss": 1.0528819561004639, + "epoch": 11.971830985915492, + "step": 3400, + "train/classification_loss": 0.2602480351924896, + "train/contrastive_loss": 1.3008562326431274, + "train/negative_loss": 0.9205397367477417, "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 1.0166934728622437, - "train/total_loss": 0.6576400399208069 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.11970577389001846, - "train/contrastive_loss": 1.3424845933914185, - "train/negative_loss": 0.2969638407230377, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 1.0455207824707031, - "train/total_loss": 0.3882026970386505 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.150417760014534, - "train/contrastive_loss": 1.411935806274414, - "train/negative_loss": 0.43394002318382263, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.9779958128929138, - "train/total_loss": 0.4328049421310425 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.08575480431318283, - "train/contrastive_loss": 1.176153302192688, - "train/negative_loss": 0.2997775971889496, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.876375675201416, - "train/total_loss": 0.32098546624183655 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.275573194026947, - "train/contrastive_loss": 1.7516385316848755, - "train/negative_loss": 0.11636717617511749, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.6352713108062744, - "train/total_loss": 0.6259008646011353 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.2601527273654938, - "train/contrastive_loss": 3.3322978019714355, - "train/negative_loss": 1.46917724609375, - "train/num_negatives": 50, "train/num_positives": 6, - "train/positive_loss": 1.863120436668396, - "train/total_loss": 0.9266122579574585 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.1617715209722519, - "train/contrastive_loss": 3.77871036529541, - "train/negative_loss": 2.8002867698669434, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.9784234762191772, - "train/total_loss": 0.9175136089324951 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.1813303679227829, - "train/contrastive_loss": 1.2024568319320679, - "train/negative_loss": 0.6160652041435242, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.5863916277885437, - "train/total_loss": 0.4218217432498932 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.21104778349399567, - "train/contrastive_loss": 0.8336138725280762, - "train/negative_loss": 0.6470433473587036, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.18657052516937256, - "train/total_loss": 0.3777705430984497 + "train/positive_loss": 0.38031646609306335, + "train/total_loss": 0.5204192996025085 }, { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.10607516020536423, - "train/contrastive_loss": 1.0436350107192993, - "train/negative_loss": 0.6289663314819336, + "epoch": 11.971830985915492, + "step": 3400, + "train/classification_loss": 0.1769106090068817, + "train/contrastive_loss": 0.6750936508178711, + "train/negative_loss": 0.6715583801269531, "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.4146687090396881, - "train/total_loss": 0.3148021697998047 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.20633763074874878, - "train/contrastive_loss": 2.135221004486084, - "train/negative_loss": 1.0959765911102295, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.039244294166565, - "train/total_loss": 0.6333818435668945 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.2199014574289322, - "train/contrastive_loss": 0.7407516241073608, - "train/negative_loss": 0.7406655550003052, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 8.607281051808968e-05, - "train/total_loss": 0.36805176734924316 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.20986421406269073, - "train/contrastive_loss": 1.7018868923187256, - "train/negative_loss": 0.4987223744392395, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 1.2031644582748413, - "train/total_loss": 0.5502415895462036 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.1960906684398651, - "train/contrastive_loss": 3.8441429138183594, - "train/negative_loss": 2.3418595790863037, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.5022833347320557, - "train/total_loss": 0.9649192094802856 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.17097105085849762, - "train/contrastive_loss": 3.099560260772705, - "train/negative_loss": 1.3702149391174316, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.7293452024459839, - "train/total_loss": 0.7908831238746643 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.13676251471042633, - "train/contrastive_loss": 1.4467281103134155, - "train/negative_loss": 1.1450998783111572, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.3016282320022583, - "train/total_loss": 0.42610812187194824 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.16720405220985413, - "train/contrastive_loss": 2.020986318588257, - "train/negative_loss": 0.9906620383262634, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 1.0303242206573486, - "train/total_loss": 0.5714013576507568 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.1777028888463974, - "train/contrastive_loss": 1.9261013269424438, - "train/negative_loss": 1.9006317853927612, - "train/num_negatives": 46, "train/num_positives": 8, - "train/positive_loss": 0.025469493120908737, - "train/total_loss": 0.5629231333732605 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.1851765662431717, - "train/contrastive_loss": 2.2849249839782715, - "train/negative_loss": 2.2591965198516846, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.025728436186909676, - "train/total_loss": 0.6421615481376648 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.19457857310771942, - "train/contrastive_loss": 1.2570396661758423, - "train/negative_loss": 1.2089214324951172, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.04811820387840271, - "train/total_loss": 0.4459865093231201 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.1657150387763977, - "train/contrastive_loss": 2.4308700561523438, - "train/negative_loss": 1.690561056137085, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.7403090000152588, - "train/total_loss": 0.6518890857696533 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.20465660095214844, - "train/contrastive_loss": 2.245161533355713, - "train/negative_loss": 0.4563505947589874, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 1.7888109683990479, - "train/total_loss": 0.653688907623291 + "train/positive_loss": 0.00353529816493392, + "train/total_loss": 0.3119293451309204 + }, + { + "epoch": 11.971830985915492, + "eval_exact_match_accuracy": 0.31746031746031744, + "eval_hamming_loss": 0.0665006743438116, + "eval_loss": 0.5517120361328125, + "eval_macro_f1": 0.4510166791146767, + "eval_macro_precision": 0.6677478588667094, + "eval_macro_recall": 0.3737002146225135, + "eval_micro_f1": 0.5706630944407234, + "eval_micro_precision": 0.7675675675675676, + "eval_micro_recall": 0.4541577825159915, + "eval_runtime": 2.8549, + "eval_samples_per_second": 198.606, + "eval_steps_per_second": 24.869, + "step": 3400 }, { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.1428832858800888, - "train/contrastive_loss": 1.9721620082855225, - "train/negative_loss": 1.0565400123596191, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.9156219363212585, - "train/total_loss": 0.5373156666755676 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.12321621924638748, - "train/contrastive_loss": 1.1471898555755615, - "train/negative_loss": 0.3549638092517853, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.7922260165214539, - "train/total_loss": 0.35265418887138367 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.25577035546302795, - "train/contrastive_loss": 1.7958661317825317, - "train/negative_loss": 0.7080191373825073, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 1.0878469944000244, - "train/total_loss": 0.6149436235427856 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.1022467315196991, - "train/contrastive_loss": 0.8800197839736938, - "train/negative_loss": 0.8800182342529297, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.5199198060145136e-06, - "train/total_loss": 0.27825069427490234 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.12307079881429672, - "train/contrastive_loss": 0.5416824817657471, - "train/negative_loss": 0.23000074923038483, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.31168174743652344, - "train/total_loss": 0.2314072996377945 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.10861074179410934, - "train/contrastive_loss": 1.512770414352417, - "train/negative_loss": 1.1104238033294678, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.4023466110229492, - "train/total_loss": 0.4111648499965668 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.1633157730102539, - "train/contrastive_loss": 1.3757665157318115, - "train/negative_loss": 1.3486353158950806, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.02713124454021454, - "train/total_loss": 0.4384690821170807 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.12319750338792801, - "train/contrastive_loss": 1.7038747072219849, - "train/negative_loss": 0.716539204120636, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.9873355031013489, - "train/total_loss": 0.46397244930267334 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.1621861308813095, - "train/contrastive_loss": 0.3981439769268036, - "train/negative_loss": 0.3950132727622986, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.0031307083554565907, - "train/total_loss": 0.24181492626667023 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.20635348558425903, - "train/contrastive_loss": 3.258335590362549, - "train/negative_loss": 1.137306571006775, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 2.1210289001464844, - "train/total_loss": 0.8580206036567688 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.20026642084121704, - "train/contrastive_loss": 2.0913925170898438, - "train/negative_loss": 1.5255707502365112, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.5658218860626221, - "train/total_loss": 0.6185449361801147 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.15809932351112366, - "train/contrastive_loss": 1.5681979656219482, - "train/negative_loss": 0.5708395838737488, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.9973583221435547, - "train/total_loss": 0.47173893451690674 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.18379944562911987, - "train/contrastive_loss": 3.337881565093994, - "train/negative_loss": 1.724287986755371, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.613593578338623, - "train/total_loss": 0.8513757586479187 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.2740629017353058, - "train/contrastive_loss": 4.115637302398682, - "train/negative_loss": 1.337350606918335, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 2.7782866954803467, - "train/total_loss": 1.0971903800964355 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.24254518747329712, - "train/contrastive_loss": 3.468578338623047, - "train/negative_loss": 1.788881778717041, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.6796964406967163, - "train/total_loss": 0.9362608790397644 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.14695322513580322, - "train/contrastive_loss": 1.3741494417190552, - "train/negative_loss": 0.6822147369384766, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.6919347047805786, - "train/total_loss": 0.42178311944007874 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.2452550232410431, - "train/contrastive_loss": 4.567511558532715, - "train/negative_loss": 1.7903480529785156, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 2.7771637439727783, - "train/total_loss": 1.1587573289871216 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.2671532928943634, - "train/contrastive_loss": 5.24977445602417, - "train/negative_loss": 3.8407533168792725, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.4090211391448975, - "train/total_loss": 1.317108154296875 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.30294525623321533, - "train/contrastive_loss": 3.58787202835083, - "train/negative_loss": 1.713004469871521, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.8748676776885986, - "train/total_loss": 1.020519733428955 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.1466289758682251, - "train/contrastive_loss": 0.7722367644309998, - "train/negative_loss": 0.7715141773223877, - "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.0007226017769426107, - "train/total_loss": 0.30107635259628296 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.1543886661529541, - "train/contrastive_loss": 1.0247857570648193, - "train/negative_loss": 0.19244001805782318, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.8323457837104797, - "train/total_loss": 0.35934582352638245 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.1072419136762619, - "train/contrastive_loss": 1.1919615268707275, - "train/negative_loss": 0.3452797532081604, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.8466817736625671, - "train/total_loss": 0.34563422203063965 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.2113160640001297, - "train/contrastive_loss": 1.7817565202713013, - "train/negative_loss": 1.7817565202713013, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5676673650741577 - }, - { - "epoch": 13.307984790874524, - "eval_exact_match_accuracy": 0.32761904761904764, - "eval_hamming_loss": 0.06442577030812324, - "eval_loss": 0.571475625038147, - "eval_macro_f1": 0.41669425466792404, - "eval_macro_precision": 0.5618890682339962, - "eval_macro_recall": 0.35526899933994144, - "eval_micro_f1": 0.6085772634445201, - "eval_micro_precision": 0.7576271186440678, - "eval_micro_recall": 0.5085324232081911, - "eval_runtime": 2.6399, - "eval_samples_per_second": 198.872, - "eval_steps_per_second": 25.001, - "step": 3500 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.09495767951011658, - "train/contrastive_loss": 0.7753824591636658, - "train/negative_loss": 0.7749974131584167, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.00038505051634274423, - "train/total_loss": 0.2500341534614563 - }, - { - "epoch": 13.307984790874524, - "step": 3500, - "train/classification_loss": 0.06983800232410431, - "train/contrastive_loss": 0.3031214475631714, - "train/negative_loss": 0.3031124770641327, - "train/num_negatives": 26, - "train/num_positives": 30, - "train/positive_loss": 8.972544492280576e-06, - "train/total_loss": 0.13046228885650635 - }, - { - "epoch": 13.49809885931559, - "grad_norm": 11.85250473022461, - "learning_rate": 1.9475342465753427e-05, - "loss": 0.4845, - "step": 3550 - }, - { - "epoch": 13.49809885931559, - "step": 3550, - "train/classification_loss": 0.12904711067676544, - "train/contrastive_loss": 0.331440806388855, - "train/negative_loss": 0.32976680994033813, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 0.001673982129432261, - "train/total_loss": 0.1953352689743042 - }, - { - "epoch": 13.49809885931559, - "step": 3550, - "train/classification_loss": 0.08709616959095001, - "train/contrastive_loss": 0.6265957951545715, - "train/negative_loss": 0.6219338178634644, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.004661986604332924, - "train/total_loss": 0.21241533756256104 - }, - { - "epoch": 13.688212927756654, - "grad_norm": 7.076729774475098, - "learning_rate": 1.9467732115677322e-05, - "loss": 0.4844, - "step": 3600 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.335163950920105, - "train/contrastive_loss": 1.8903896808624268, - "train/negative_loss": 0.7793095707893372, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.1110800504684448, - "train/total_loss": 0.7132419347763062 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.14903075993061066, - "train/contrastive_loss": 2.4317402839660645, - "train/negative_loss": 1.7178329229354858, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.7139074206352234, - "train/total_loss": 0.6353788375854492 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.17851008474826813, - "train/contrastive_loss": 1.6044678688049316, - "train/negative_loss": 0.5328871607780457, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.0715807676315308, - "train/total_loss": 0.4994036555290222 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.2292245775461197, - "train/contrastive_loss": 4.995362758636475, - "train/negative_loss": 3.749850034713745, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.2455127239227295, - "train/total_loss": 1.2282971143722534 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.08983594179153442, - "train/contrastive_loss": 0.9388681650161743, - "train/negative_loss": 0.8050909638404846, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.1337772160768509, - "train/total_loss": 0.27760958671569824 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.16850288212299347, - "train/contrastive_loss": 1.8879646062850952, - "train/negative_loss": 1.2986431121826172, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.589321494102478, - "train/total_loss": 0.5460957884788513 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.26228269934654236, - "train/contrastive_loss": 2.7020928859710693, - "train/negative_loss": 1.7281032800674438, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.9739896655082703, - "train/total_loss": 0.8027012348175049 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.12437035143375397, - "train/contrastive_loss": 1.4505749940872192, - "train/negative_loss": 0.8962615728378296, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.5543134212493896, - "train/total_loss": 0.4144853353500366 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.1362912505865097, - "train/contrastive_loss": 0.999822199344635, - "train/negative_loss": 0.9981356859207153, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.0016865277430042624, - "train/total_loss": 0.3362556993961334 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.2979413866996765, - "train/contrastive_loss": 3.155141830444336, - "train/negative_loss": 1.4392178058624268, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.7159240245819092, - "train/total_loss": 0.9289697408676147 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.13663733005523682, - "train/contrastive_loss": 1.8376799821853638, - "train/negative_loss": 1.3860126733779907, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.45166730880737305, - "train/total_loss": 0.5041733384132385 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.08377191424369812, - "train/contrastive_loss": 0.6757700443267822, - "train/negative_loss": 0.08437209576368332, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.5913979411125183, - "train/total_loss": 0.21892592310905457 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.17227259278297424, - "train/contrastive_loss": 2.8360133171081543, - "train/negative_loss": 2.3279361724853516, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.5080772638320923, - "train/total_loss": 0.7394752502441406 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.10940822958946228, - "train/contrastive_loss": 2.6894724369049072, - "train/negative_loss": 2.689211130142212, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.0002612533571664244, - "train/total_loss": 0.6473027467727661 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.1050514280796051, - "train/contrastive_loss": 1.467414379119873, - "train/negative_loss": 1.4663289785385132, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.0010853888234123588, - "train/total_loss": 0.39853429794311523 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.12355905771255493, - "train/contrastive_loss": 0.5843364000320435, - "train/negative_loss": 0.32170039415359497, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.2626360356807709, - "train/total_loss": 0.24042633175849915 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.22168761491775513, - "train/contrastive_loss": 2.957345485687256, - "train/negative_loss": 1.7642492055892944, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.193096399307251, - "train/total_loss": 0.8131567239761353 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.16153278946876526, - "train/contrastive_loss": 0.871544599533081, - "train/negative_loss": 0.21794286370277405, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.6536017656326294, - "train/total_loss": 0.33584171533584595 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.2000763714313507, - "train/contrastive_loss": 2.376762866973877, - "train/negative_loss": 1.7546075582504272, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.6221551895141602, - "train/total_loss": 0.6754289865493774 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.13804754614830017, - "train/contrastive_loss": 2.4159562587738037, - "train/negative_loss": 1.5846763849258423, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.8312799334526062, - "train/total_loss": 0.6212388277053833 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.2350514680147171, - "train/contrastive_loss": 1.8982211351394653, - "train/negative_loss": 0.31204620003700256, - "train/num_negatives": 44, - "train/num_positives": 10, - "train/positive_loss": 1.5861749649047852, - "train/total_loss": 0.6146957278251648 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.2496965080499649, - "train/contrastive_loss": 2.717409133911133, - "train/negative_loss": 1.2564703226089478, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 1.4609389305114746, - "train/total_loss": 0.7931783199310303 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.11457334458827972, - "train/contrastive_loss": 1.1458076238632202, - "train/negative_loss": 0.452790230512619, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.6930174231529236, - "train/total_loss": 0.34373486042022705 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.16085779666900635, - "train/contrastive_loss": 0.9832051396369934, - "train/negative_loss": 0.6932693123817444, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.289935827255249, - "train/total_loss": 0.35749882459640503 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.09554963558912277, - "train/contrastive_loss": 1.7714836597442627, - "train/negative_loss": 0.8275248408317566, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.9439588189125061, - "train/total_loss": 0.44984638690948486 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.2893787920475006, - "train/contrastive_loss": 1.8151218891143799, - "train/negative_loss": 0.31560346484184265, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.4995183944702148, - "train/total_loss": 0.6524031758308411 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.2540786564350128, - "train/contrastive_loss": 4.203415870666504, - "train/negative_loss": 1.3638546466827393, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 2.8395609855651855, - "train/total_loss": 1.094761848449707 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.1641659438610077, - "train/contrastive_loss": 3.411652088165283, - "train/negative_loss": 2.312633991241455, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 1.0990180969238281, - "train/total_loss": 0.8464963436126709 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.16859547793865204, - "train/contrastive_loss": 1.3198440074920654, - "train/negative_loss": 0.6633925437927246, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.6564515233039856, - "train/total_loss": 0.43256425857543945 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.20458868145942688, - "train/contrastive_loss": 0.7135464549064636, - "train/negative_loss": 0.5414690375328064, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.17207743227481842, - "train/total_loss": 0.3472979664802551 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.11841384321451187, - "train/contrastive_loss": 2.131989002227783, - "train/negative_loss": 1.43477463722229, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.6972143650054932, - "train/total_loss": 0.5448116660118103 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.22719982266426086, - "train/contrastive_loss": 1.8737785816192627, - "train/negative_loss": 1.1563903093338013, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.7173882126808167, - "train/total_loss": 0.6019555330276489 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.20763707160949707, - "train/contrastive_loss": 0.9408699870109558, - "train/negative_loss": 0.9408524632453918, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 1.752391835907474e-05, - "train/total_loss": 0.3958110809326172 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.18446210026741028, - "train/contrastive_loss": 2.3975300788879395, - "train/negative_loss": 1.6703517436981201, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.7271783351898193, - "train/total_loss": 0.6639680862426758 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.20662075281143188, - "train/contrastive_loss": 4.551051139831543, - "train/negative_loss": 2.804849863052368, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.7462012767791748, - "train/total_loss": 1.1168310642242432 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.17557038366794586, - "train/contrastive_loss": 3.6461362838745117, - "train/negative_loss": 1.5018163919448853, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 2.144320011138916, - "train/total_loss": 0.9047976136207581 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.12159689515829086, - "train/contrastive_loss": 1.4067925214767456, - "train/negative_loss": 0.8090495467185974, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.5977429747581482, - "train/total_loss": 0.40295541286468506 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.18210750818252563, - "train/contrastive_loss": 1.4862384796142578, - "train/negative_loss": 1.1460953950881958, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.340143084526062, - "train/total_loss": 0.47935521602630615 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.19576576352119446, - "train/contrastive_loss": 3.2953617572784424, - "train/negative_loss": 2.581338405609131, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.7140232920646667, - "train/total_loss": 0.8548381328582764 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.19157135486602783, - "train/contrastive_loss": 2.8093786239624023, - "train/negative_loss": 2.757551670074463, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.051827069371938705, - "train/total_loss": 0.7534471154212952 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.1649261862039566, - "train/contrastive_loss": 1.5541354417800903, - "train/negative_loss": 1.0878556966781616, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.4662797451019287, - "train/total_loss": 0.4757533073425293 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.14506405591964722, - "train/contrastive_loss": 2.3942675590515137, - "train/negative_loss": 2.0165863037109375, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.377681165933609, - "train/total_loss": 0.6239175796508789 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.22472748160362244, - "train/contrastive_loss": 1.039717197418213, - "train/negative_loss": 0.1796916425228119, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.8600255846977234, - "train/total_loss": 0.432670921087265 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.13948215544223785, - "train/contrastive_loss": 2.1238226890563965, - "train/negative_loss": 1.044872522354126, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.078950047492981, - "train/total_loss": 0.5642467141151428 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.12385927885770798, - "train/contrastive_loss": 1.767095685005188, - "train/negative_loss": 1.1738617420196533, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.5932339429855347, - "train/total_loss": 0.4772784411907196 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.2831486165523529, - "train/contrastive_loss": 2.5532188415527344, - "train/negative_loss": 0.9639943838119507, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 1.5892243385314941, - "train/total_loss": 0.7937923669815063 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.11027621477842331, - "train/contrastive_loss": 1.1131068468093872, - "train/negative_loss": 1.1131056547164917, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.1622913689279812e-06, - "train/total_loss": 0.3328975737094879 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.12585696578025818, - "train/contrastive_loss": 0.29224056005477905, - "train/negative_loss": 0.26478663086891174, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.027453919872641563, - "train/total_loss": 0.1843050718307495 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.07150980830192566, - "train/contrastive_loss": 0.7472353577613831, - "train/negative_loss": 0.6601259112358093, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.08710946142673492, - "train/total_loss": 0.22095687687397003 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.15224318206310272, - "train/contrastive_loss": 0.6254110932350159, - "train/negative_loss": 0.5881865620613098, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.03722451254725456, - "train/total_loss": 0.2773253917694092 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.1330820471048355, - "train/contrastive_loss": 2.037640333175659, - "train/negative_loss": 0.8156668543815613, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.2219734191894531, - "train/total_loss": 0.540610134601593 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.17759263515472412, - "train/contrastive_loss": 0.4302414357662201, - "train/negative_loss": 0.42499393224716187, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.00524749793112278, - "train/total_loss": 0.2636409401893616 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.16675981879234314, - "train/contrastive_loss": 1.5204442739486694, - "train/negative_loss": 1.001295804977417, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.5191484689712524, - "train/total_loss": 0.4708486795425415 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.2320711761713028, - "train/contrastive_loss": 3.475731372833252, - "train/negative_loss": 2.812709093093872, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.6630222201347351, - "train/total_loss": 0.927217423915863 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.131034716963768, - "train/contrastive_loss": 0.5083518028259277, - "train/negative_loss": 0.2934130132198334, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.21493875980377197, - "train/total_loss": 0.23270508646965027 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.19348406791687012, - "train/contrastive_loss": 2.783698558807373, - "train/negative_loss": 2.1493895053863525, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.6343090534210205, - "train/total_loss": 0.7502238154411316 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.25158241391181946, - "train/contrastive_loss": 2.6224541664123535, - "train/negative_loss": 1.409590482711792, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.2128636837005615, - "train/total_loss": 0.7760732173919678 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.22276180982589722, - "train/contrastive_loss": 2.8738763332366943, - "train/negative_loss": 1.3696191310882568, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.5042572021484375, - "train/total_loss": 0.797537088394165 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.17724193632602692, - "train/contrastive_loss": 3.1224632263183594, - "train/negative_loss": 2.720937728881836, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.4015255868434906, - "train/total_loss": 0.8017345666885376 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.245761901140213, - "train/contrastive_loss": 4.053491592407227, - "train/negative_loss": 1.724683165550232, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 2.328808307647705, - "train/total_loss": 1.0564602613449097 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.24506162106990814, - "train/contrastive_loss": 5.3136491775512695, - "train/negative_loss": 4.340853214263916, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.972795844078064, - "train/total_loss": 1.3077914714813232 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.30460765957832336, - "train/contrastive_loss": 3.4824578762054443, - "train/negative_loss": 1.859214186668396, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.6232436895370483, - "train/total_loss": 1.0010992288589478 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.15134547650814056, - "train/contrastive_loss": 0.7010270357131958, - "train/negative_loss": 0.6990858316421509, - "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.0019411809043958783, - "train/total_loss": 0.291550874710083 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.1653921753168106, - "train/contrastive_loss": 1.5142652988433838, - "train/negative_loss": 0.8623071908950806, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.6519580483436584, - "train/total_loss": 0.468245267868042 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.13636566698551178, - "train/contrastive_loss": 1.7412843704223633, - "train/negative_loss": 0.9546482563018799, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.7866360545158386, - "train/total_loss": 0.4846225380897522 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.19187602400779724, - "train/contrastive_loss": 1.4372056722640991, - "train/negative_loss": 1.4372056722640991, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.47931715846061707 - }, - { - "epoch": 13.688212927756654, - "eval_exact_match_accuracy": 0.3523809523809524, - "eval_hamming_loss": 0.06263305322128851, - "eval_loss": 0.5955240726470947, - "eval_macro_f1": 0.4260996486945703, - "eval_macro_precision": 0.5864445744992514, - "eval_macro_recall": 0.3479451478011561, - "eval_micro_f1": 0.6184300341296929, - "eval_micro_precision": 0.773037542662116, - "eval_micro_recall": 0.515358361774744, - "eval_runtime": 2.6261, - "eval_samples_per_second": 199.919, - "eval_steps_per_second": 25.133, - "step": 3600 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.12057598680257797, - "train/contrastive_loss": 0.21088619530200958, - "train/negative_loss": 0.2108125537633896, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 7.364232442341745e-05, - "train/total_loss": 0.16275322437286377 - }, - { - "epoch": 13.688212927756654, - "step": 3600, - "train/classification_loss": 0.08859866857528687, - "train/contrastive_loss": 0.5017707347869873, - "train/negative_loss": 0.24695512652397156, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.25481560826301575, - "train/total_loss": 0.18895281851291656 - }, - { - "epoch": 13.87832699619772, - "grad_norm": 5.867966175079346, - "learning_rate": 1.946012176560122e-05, - "loss": 0.5009, - "step": 3650 - }, - { - "epoch": 13.87832699619772, - "step": 3650, - "train/classification_loss": 0.13166671991348267, - "train/contrastive_loss": 0.35157403349876404, - "train/negative_loss": 0.25834035873413086, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.09323367476463318, - "train/total_loss": 0.2019815295934677 - }, - { - "epoch": 13.87832699619772, - "step": 3650, - "train/classification_loss": 0.12082459032535553, - "train/contrastive_loss": 0.46114468574523926, - "train/negative_loss": 0.3269093632698059, - "train/num_negatives": 44, - "train/num_positives": 4, - "train/positive_loss": 0.13423530757427216, - "train/total_loss": 0.21305352449417114 - }, - { - "epoch": 14.068441064638783, - "grad_norm": 6.448967933654785, - "learning_rate": 1.9452511415525115e-05, - "loss": 0.5115, - "step": 3700 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.3585938811302185, - "train/contrastive_loss": 2.357288360595703, - "train/negative_loss": 0.9972198009490967, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.360068440437317, - "train/total_loss": 0.8300515413284302 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.14021819829940796, - "train/contrastive_loss": 2.0413589477539062, - "train/negative_loss": 1.4158021211624146, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.6255568861961365, - "train/total_loss": 0.5484899878501892 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.163238987326622, - "train/contrastive_loss": 1.234662652015686, - "train/negative_loss": 0.35549384355545044, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.8791688084602356, - "train/total_loss": 0.4101715087890625 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.24983720481395721, - "train/contrastive_loss": 2.9556329250335693, - "train/negative_loss": 1.5776840448379517, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.3779488801956177, - "train/total_loss": 0.8409638404846191 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.10700077563524246, - "train/contrastive_loss": 1.5548912286758423, - "train/negative_loss": 0.8523808717727661, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.7025103569030762, - "train/total_loss": 0.41797903180122375 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.18116974830627441, - "train/contrastive_loss": 2.0017848014831543, - "train/negative_loss": 1.2942559719085693, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.7075287699699402, - "train/total_loss": 0.5815267562866211 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.2484801858663559, - "train/contrastive_loss": 2.8584702014923096, - "train/negative_loss": 1.670781135559082, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 1.1876890659332275, - "train/total_loss": 0.8201742768287659 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.1368902176618576, - "train/contrastive_loss": 2.3047218322753906, - "train/negative_loss": 1.2378597259521484, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.0668621063232422, - "train/total_loss": 0.597834587097168 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.13797473907470703, - "train/contrastive_loss": 1.1777429580688477, - "train/negative_loss": 1.1666278839111328, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.011115024797618389, - "train/total_loss": 0.3735233545303345 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.24447453022003174, - "train/contrastive_loss": 2.2506628036499023, - "train/negative_loss": 1.5210305452346802, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.7296321392059326, - "train/total_loss": 0.694607138633728 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.14320158958435059, - "train/contrastive_loss": 1.7561496496200562, - "train/negative_loss": 1.3634506464004517, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.3926989734172821, - "train/total_loss": 0.4944315254688263 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.1164720207452774, - "train/contrastive_loss": 2.464402198791504, - "train/negative_loss": 1.0083853006362915, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 1.4560168981552124, - "train/total_loss": 0.6093524694442749 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.15620571374893188, - "train/contrastive_loss": 2.2611591815948486, - "train/negative_loss": 1.8981926441192627, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.36296647787094116, - "train/total_loss": 0.6084375381469727 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.09255626797676086, - "train/contrastive_loss": 2.236625909805298, - "train/negative_loss": 2.236483097076416, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.00014280021423473954, - "train/total_loss": 0.5398814678192139 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.10077201575040817, - "train/contrastive_loss": 1.8419898748397827, - "train/negative_loss": 1.3006126880645752, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.5413771867752075, - "train/total_loss": 0.4691700041294098 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.13361068069934845, - "train/contrastive_loss": 0.9279939532279968, - "train/negative_loss": 0.4377748370170593, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.4902191162109375, - "train/total_loss": 0.3192094564437866 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.21815776824951172, - "train/contrastive_loss": 1.919663667678833, - "train/negative_loss": 1.2536709308624268, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.6659927368164062, - "train/total_loss": 0.6020904779434204 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.18154340982437134, - "train/contrastive_loss": 1.599839448928833, - "train/negative_loss": 0.6465356945991516, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.9533037543296814, - "train/total_loss": 0.5015113353729248 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.18521247804164886, - "train/contrastive_loss": 1.2551571130752563, - "train/negative_loss": 0.9995535612106323, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.255603551864624, - "train/total_loss": 0.4362438917160034 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.12444712221622467, - "train/contrastive_loss": 1.4273104667663574, - "train/negative_loss": 0.9677788615226746, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.4595315456390381, - "train/total_loss": 0.4099092483520508 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.21046175062656403, - "train/contrastive_loss": 1.5942564010620117, - "train/negative_loss": 0.2673007845878601, - "train/num_negatives": 44, - "train/num_positives": 10, - "train/positive_loss": 1.3269556760787964, - "train/total_loss": 0.5293130278587341 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.24136745929718018, - "train/contrastive_loss": 2.3010289669036865, - "train/negative_loss": 1.4663809537887573, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 0.8346480131149292, - "train/total_loss": 0.7015732526779175 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.1309441775083542, - "train/contrastive_loss": 2.011026382446289, - "train/negative_loss": 0.5773321986198425, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 1.4336942434310913, - "train/total_loss": 0.5331494808197021 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.14283227920532227, - "train/contrastive_loss": 0.8608816862106323, - "train/negative_loss": 0.61766117811203, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.2432205229997635, - "train/total_loss": 0.31500864028930664 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.09270927309989929, - "train/contrastive_loss": 1.571791172027588, - "train/negative_loss": 0.28793224692344666, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 1.2838588953018188, - "train/total_loss": 0.40706750750541687 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.2889455258846283, - "train/contrastive_loss": 1.2768985033035278, - "train/negative_loss": 0.1658736914396286, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.1110248565673828, - "train/total_loss": 0.5443252325057983 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.27027514576911926, - "train/contrastive_loss": 2.862379550933838, - "train/negative_loss": 1.6064236164093018, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.2559559345245361, - "train/total_loss": 0.8427510261535645 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.16815300285816193, - "train/contrastive_loss": 4.056977272033691, - "train/negative_loss": 2.9377944469451904, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 1.1191829442977905, - "train/total_loss": 0.979548454284668 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.21547484397888184, - "train/contrastive_loss": 2.1483607292175293, - "train/negative_loss": 0.969599187374115, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 1.178761601448059, - "train/total_loss": 0.6451469659805298 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.19543026387691498, - "train/contrastive_loss": 0.8498372435569763, - "train/negative_loss": 0.8272091150283813, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.02262813039124012, - "train/total_loss": 0.36539772152900696 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.10677438974380493, - "train/contrastive_loss": 1.1458441019058228, - "train/negative_loss": 0.4168267250061035, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.7290173768997192, - "train/total_loss": 0.33594322204589844 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.21457913517951965, - "train/contrastive_loss": 2.1821365356445312, - "train/negative_loss": 1.0434339046478271, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.1387027502059937, - "train/total_loss": 0.6510064601898193 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.2613561153411865, - "train/contrastive_loss": 1.524716854095459, - "train/negative_loss": 1.5246975421905518, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 1.9312092263135128e-05, - "train/total_loss": 0.5662994980812073 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.17188237607479095, - "train/contrastive_loss": 0.9483532905578613, - "train/negative_loss": 0.29630550742149353, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.6520477533340454, - "train/total_loss": 0.36155304312705994 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.18231739103794098, - "train/contrastive_loss": 3.1977109909057617, - "train/negative_loss": 1.963308572769165, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.2344025373458862, - "train/total_loss": 0.82185959815979 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.17000621557235718, - "train/contrastive_loss": 2.8481605052948, - "train/negative_loss": 1.2338292598724365, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.6143312454223633, - "train/total_loss": 0.7396383285522461 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.12733139097690582, - "train/contrastive_loss": 1.170665979385376, - "train/negative_loss": 0.7432991862297058, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.4273667633533478, - "train/total_loss": 0.36146458983421326 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.1476050764322281, - "train/contrastive_loss": 0.921297550201416, - "train/negative_loss": 0.9212462902069092, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 5.12613078171853e-05, - "train/total_loss": 0.331864595413208 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.1800297647714615, - "train/contrastive_loss": 1.9821410179138184, - "train/negative_loss": 1.4661439657211304, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.515997052192688, - "train/total_loss": 0.5764579772949219 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.16493426263332367, - "train/contrastive_loss": 2.026400327682495, - "train/negative_loss": 1.9858546257019043, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.040545638650655746, - "train/total_loss": 0.5702143311500549 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.14359812438488007, - "train/contrastive_loss": 0.7421274185180664, - "train/negative_loss": 0.6859136819839478, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.05621371418237686, - "train/total_loss": 0.29202359914779663 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.17165178060531616, - "train/contrastive_loss": 2.3192543983459473, - "train/negative_loss": 1.4799981117248535, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.8392562866210938, - "train/total_loss": 0.6355026960372925 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.2095361351966858, - "train/contrastive_loss": 1.6575994491577148, - "train/negative_loss": 0.3395625948905945, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 1.3180367946624756, - "train/total_loss": 0.5410560369491577 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.13107185065746307, - "train/contrastive_loss": 1.6554667949676514, - "train/negative_loss": 0.9677079916000366, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.6877588033676147, - "train/total_loss": 0.4621652364730835 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.1147797703742981, - "train/contrastive_loss": 1.3863153457641602, - "train/negative_loss": 0.4163660705089569, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.9699493050575256, - "train/total_loss": 0.3920428454875946 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.24301372468471527, - "train/contrastive_loss": 0.8343802094459534, - "train/negative_loss": 0.6141822934150696, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.2201979011297226, - "train/total_loss": 0.40988975763320923 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.10232861340045929, - "train/contrastive_loss": 0.6727244853973389, - "train/negative_loss": 0.6727177500724792, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 6.70556073600892e-06, - "train/total_loss": 0.23687350749969482 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.1062355637550354, - "train/contrastive_loss": 0.5808340311050415, - "train/negative_loss": 0.3547109067440033, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.2261231243610382, - "train/total_loss": 0.22240236401557922 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.09119691699743271, - "train/contrastive_loss": 1.1844218969345093, - "train/negative_loss": 0.9822262525558472, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.2021956443786621, - "train/total_loss": 0.32808130979537964 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.15053844451904297, - "train/contrastive_loss": 0.45910000801086426, - "train/negative_loss": 0.3428248465061188, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.11627516150474548, - "train/total_loss": 0.24235844612121582 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.1229308620095253, - "train/contrastive_loss": 1.690266489982605, - "train/negative_loss": 0.7210255861282349, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.9692409038543701, - "train/total_loss": 0.46098417043685913 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.1604672372341156, - "train/contrastive_loss": 0.2982664108276367, - "train/negative_loss": 0.29802221059799194, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.00024418841348960996, - "train/total_loss": 0.22012051939964294 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.17570117115974426, - "train/contrastive_loss": 1.755236029624939, - "train/negative_loss": 1.1586592197418213, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.5965768098831177, - "train/total_loss": 0.5267484188079834 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.2201797068119049, - "train/contrastive_loss": 2.9012749195098877, - "train/negative_loss": 2.253678798675537, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.6475960612297058, - "train/total_loss": 0.8004347085952759 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.154937744140625, - "train/contrastive_loss": 1.999124526977539, - "train/negative_loss": 0.5187737345695496, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 1.4803508520126343, - "train/total_loss": 0.5547626614570618 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.15573161840438843, - "train/contrastive_loss": 2.3865928649902344, - "train/negative_loss": 1.3493322134017944, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.0372607707977295, - "train/total_loss": 0.6330502033233643 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.27403977513313293, - "train/contrastive_loss": 3.0870819091796875, - "train/negative_loss": 1.422607421875, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.6644744873046875, - "train/total_loss": 0.891456127166748 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.2262650430202484, - "train/contrastive_loss": 3.509730339050293, - "train/negative_loss": 1.6430470943450928, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.8666832447052002, - "train/total_loss": 0.9282110929489136 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.16475172340869904, - "train/contrastive_loss": 2.0731396675109863, - "train/negative_loss": 1.1593363285064697, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.9138032793998718, - "train/total_loss": 0.579379677772522 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.23674167692661285, - "train/contrastive_loss": 3.6376912593841553, - "train/negative_loss": 1.676735281944275, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.9609559774398804, - "train/total_loss": 0.9642799496650696 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.24140577018260956, - "train/contrastive_loss": 3.7778842449188232, - "train/negative_loss": 2.7459001541137695, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.0319840908050537, - "train/total_loss": 0.9969826340675354 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.29733774065971375, - "train/contrastive_loss": 3.3896241188049316, - "train/negative_loss": 1.7102601528167725, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.6793640851974487, - "train/total_loss": 0.9752625226974487 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.14177097380161285, - "train/contrastive_loss": 0.6974367499351501, - "train/negative_loss": 0.6967818140983582, - "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.0006549169775098562, - "train/total_loss": 0.28125834465026855 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.1639096587896347, - "train/contrastive_loss": 1.398608684539795, - "train/negative_loss": 0.7461845278739929, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.6524240970611572, - "train/total_loss": 0.4436314105987549 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.12120488286018372, - "train/contrastive_loss": 1.4893848896026611, - "train/negative_loss": 0.7995643019676208, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.6898205280303955, - "train/total_loss": 0.4190818667411804 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.18646278977394104, - "train/contrastive_loss": 1.8487077951431274, - "train/negative_loss": 1.8487077951431274, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5562043190002441 - }, - { - "epoch": 14.068441064638783, - "eval_exact_match_accuracy": 0.35619047619047617, - "eval_hamming_loss": 0.06296918767507002, - "eval_loss": 0.5496504306793213, - "eval_macro_f1": 0.4183811717065943, - "eval_macro_precision": 0.5769104598564752, - "eval_macro_recall": 0.3414795859502789, - "eval_micro_f1": 0.6102635228848821, - "eval_micro_precision": 0.7815275310834814, - "eval_micro_recall": 0.5005688282138794, - "eval_runtime": 2.6302, - "eval_samples_per_second": 199.601, - "eval_steps_per_second": 25.093, - "step": 3700 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.096537284553051, - "train/contrastive_loss": 0.5358088612556458, - "train/negative_loss": 0.057345788925886154, - "train/num_negatives": 30, - "train/num_positives": 18, - "train/positive_loss": 0.4784630835056305, - "train/total_loss": 0.2036990523338318 - }, - { - "epoch": 14.068441064638783, - "step": 3700, - "train/classification_loss": 0.0830332413315773, - "train/contrastive_loss": 0.46615293622016907, - "train/negative_loss": 0.4659242331981659, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.00022869113308843225, - "train/total_loss": 0.17626383900642395 - }, - { - "epoch": 14.258555133079849, - "grad_norm": 5.382350444793701, - "learning_rate": 1.9444901065449013e-05, - "loss": 0.4669, - "step": 3750 - }, - { - "epoch": 14.258555133079849, - "step": 3750, - "train/classification_loss": 0.11861798167228699, - "train/contrastive_loss": 0.3972126245498657, - "train/negative_loss": 0.369985431432724, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.027227208018302917, - "train/total_loss": 0.1980605125427246 - }, - { - "epoch": 14.258555133079849, - "step": 3750, - "train/classification_loss": 0.10711941868066788, - "train/contrastive_loss": 0.4406331181526184, - "train/negative_loss": 0.37734484672546387, - "train/num_negatives": 40, - "train/num_positives": 8, - "train/positive_loss": 0.06328826397657394, - "train/total_loss": 0.19524604082107544 - }, - { - "epoch": 14.448669201520913, - "grad_norm": 7.8520097732543945, - "learning_rate": 1.943729071537291e-05, - "loss": 0.4524, - "step": 3800 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.3062390387058258, - "train/contrastive_loss": 2.185359477996826, - "train/negative_loss": 0.7890573740005493, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.3963021039962769, - "train/total_loss": 0.7433109283447266 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.16075290739536285, - "train/contrastive_loss": 2.283289909362793, - "train/negative_loss": 1.2548671960830688, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 1.0284227132797241, - "train/total_loss": 0.6174108982086182 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.17344963550567627, - "train/contrastive_loss": 1.2401823997497559, - "train/negative_loss": 0.11001575738191605, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.1301666498184204, - "train/total_loss": 0.42148613929748535 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.24602924287319183, - "train/contrastive_loss": 3.3006856441497803, - "train/negative_loss": 1.900410771369934, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.4002748727798462, - "train/total_loss": 0.9061663746833801 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.1011304184794426, - "train/contrastive_loss": 1.7049965858459473, - "train/negative_loss": 1.1815415620803833, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.5234549641609192, - "train/total_loss": 0.4421297609806061 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.17130064964294434, - "train/contrastive_loss": 1.760608196258545, - "train/negative_loss": 1.3269312381744385, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.43367692828178406, - "train/total_loss": 0.5234223008155823 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.2553638815879822, - "train/contrastive_loss": 3.0276124477386475, - "train/negative_loss": 2.04402756690979, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.9835849404335022, - "train/total_loss": 0.8608863949775696 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.13498912751674652, - "train/contrastive_loss": 2.102015733718872, - "train/negative_loss": 1.4098832607269287, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.6921325325965881, - "train/total_loss": 0.5553922653198242 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.14662112295627594, - "train/contrastive_loss": 1.2642680406570435, - "train/negative_loss": 0.9616250991821289, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.30264294147491455, - "train/total_loss": 0.39947474002838135 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.2825922966003418, - "train/contrastive_loss": 3.306548833847046, - "train/negative_loss": 2.1055309772491455, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.2010178565979004, - "train/total_loss": 0.9439020752906799 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.1682652235031128, - "train/contrastive_loss": 2.603313446044922, - "train/negative_loss": 1.6491104364395142, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.9542031288146973, - "train/total_loss": 0.688927948474884 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.12206681817770004, - "train/contrastive_loss": 2.2216687202453613, - "train/negative_loss": 0.9688575267791748, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 1.252811312675476, - "train/total_loss": 0.5664005875587463 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.16437393426895142, - "train/contrastive_loss": 2.5142040252685547, - "train/negative_loss": 1.684278130531311, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.8299258351325989, - "train/total_loss": 0.6672147512435913 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.08824069797992706, - "train/contrastive_loss": 1.7730432748794556, - "train/negative_loss": 1.7729753255844116, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 6.793637294322252e-05, - "train/total_loss": 0.442849338054657 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.10005499422550201, - "train/contrastive_loss": 1.0647850036621094, - "train/negative_loss": 0.9825038313865662, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.08228122442960739, - "train/total_loss": 0.3130120038986206 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.14749962091445923, - "train/contrastive_loss": 1.5817294120788574, - "train/negative_loss": 0.7299968600273132, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.8517325520515442, - "train/total_loss": 0.46384552121162415 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.24657268822193146, - "train/contrastive_loss": 2.539597511291504, - "train/negative_loss": 1.1398730278015137, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.3997244834899902, - "train/total_loss": 0.7544921636581421 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.18413294851779938, - "train/contrastive_loss": 1.1241651773452759, - "train/negative_loss": 0.2498588263988495, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.874306321144104, - "train/total_loss": 0.4089660048484802 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.17222169041633606, - "train/contrastive_loss": 1.1046503782272339, - "train/negative_loss": 0.6956959366798401, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.4089544713497162, - "train/total_loss": 0.39315176010131836 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.15270979702472687, - "train/contrastive_loss": 1.999328851699829, - "train/negative_loss": 1.6335686445236206, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.3657602071762085, - "train/total_loss": 0.5525755882263184 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.2245589643716812, - "train/contrastive_loss": 1.7727773189544678, - "train/negative_loss": 0.26955822110176086, - "train/num_negatives": 44, - "train/num_positives": 10, - "train/positive_loss": 1.5032191276550293, - "train/total_loss": 0.5791144371032715 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.25176551938056946, - "train/contrastive_loss": 3.1813888549804688, - "train/negative_loss": 1.3817564249038696, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 1.7996325492858887, - "train/total_loss": 0.8880432844161987 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.1250697821378708, - "train/contrastive_loss": 1.9951462745666504, - "train/negative_loss": 0.5371652245521545, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 1.4579811096191406, - "train/total_loss": 0.5240990519523621 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.17136652767658234, - "train/contrastive_loss": 1.9851714372634888, - "train/negative_loss": 0.7440030574798584, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 1.2411683797836304, - "train/total_loss": 0.5684008002281189 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.08082704991102219, - "train/contrastive_loss": 1.154155969619751, - "train/negative_loss": 0.18534831702709198, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.9688076376914978, - "train/total_loss": 0.31165823340415955 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.3060009479522705, - "train/contrastive_loss": 1.6742417812347412, - "train/negative_loss": 0.19492240250110626, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.4793193340301514, - "train/total_loss": 0.6408493518829346 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.2620938718318939, - "train/contrastive_loss": 3.0984442234039307, - "train/negative_loss": 1.1848738193511963, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.9135704040527344, - "train/total_loss": 0.8817827701568604 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.17955489456653595, - "train/contrastive_loss": 3.904538154602051, - "train/negative_loss": 2.5380468368530273, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 1.3664911985397339, - "train/total_loss": 0.9604625105857849 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.18529272079467773, - "train/contrastive_loss": 1.4992948770523071, - "train/negative_loss": 0.7462634444236755, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.7530314326286316, - "train/total_loss": 0.4851517081260681 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.21719060838222504, - "train/contrastive_loss": 1.0487416982650757, - "train/negative_loss": 0.6513720154762268, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.39736971259117126, - "train/total_loss": 0.4269389510154724 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.10896074026823044, - "train/contrastive_loss": 1.4730846881866455, - "train/negative_loss": 0.7471706867218018, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.725913941860199, - "train/total_loss": 0.40357768535614014 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.23961152136325836, - "train/contrastive_loss": 2.2325878143310547, - "train/negative_loss": 0.9586185812950134, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.273969292640686, - "train/total_loss": 0.686129093170166 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.26686325669288635, - "train/contrastive_loss": 1.1205928325653076, - "train/negative_loss": 1.1205586194992065, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 3.421365181566216e-05, - "train/total_loss": 0.4909818172454834 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.1609576791524887, - "train/contrastive_loss": 0.4306389093399048, - "train/negative_loss": 0.4155276119709015, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.015111301094293594, - "train/total_loss": 0.24708545207977295 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.21477676928043365, - "train/contrastive_loss": 3.754474639892578, - "train/negative_loss": 2.6876907348632812, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.0667839050292969, - "train/total_loss": 0.965671718120575 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.18476934731006622, - "train/contrastive_loss": 3.160276412963867, - "train/negative_loss": 1.222172737121582, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.9381036758422852, - "train/total_loss": 0.8168246150016785 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.11324022710323334, - "train/contrastive_loss": 0.9753639698028564, - "train/negative_loss": 0.4928487241268158, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.48251521587371826, - "train/total_loss": 0.3083130121231079 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.1572825163602829, - "train/contrastive_loss": 1.523755669593811, - "train/negative_loss": 0.9093173146247864, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.6144383549690247, - "train/total_loss": 0.46203362941741943 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.187114879488945, - "train/contrastive_loss": 2.1459832191467285, - "train/negative_loss": 1.6753500699996948, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.4706330895423889, - "train/total_loss": 0.6163115501403809 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.17688573896884918, - "train/contrastive_loss": 1.9834625720977783, - "train/negative_loss": 1.9754489660263062, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.008013621903955936, - "train/total_loss": 0.5735782384872437 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.16251137852668762, - "train/contrastive_loss": 0.8155778050422668, - "train/negative_loss": 0.6359920501708984, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.1795857548713684, - "train/total_loss": 0.325626939535141 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.1716797649860382, - "train/contrastive_loss": 2.554873466491699, - "train/negative_loss": 1.77324378490448, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.7816295623779297, - "train/total_loss": 0.6826545000076294 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.2091578096151352, - "train/contrastive_loss": 1.7601925134658813, - "train/negative_loss": 0.2519100606441498, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 1.5082824230194092, - "train/total_loss": 0.5611963272094727 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.15349727869033813, - "train/contrastive_loss": 2.067821502685547, - "train/negative_loss": 1.5504039525985718, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.5174174308776855, - "train/total_loss": 0.5670615434646606 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.1314135491847992, - "train/contrastive_loss": 1.0533554553985596, - "train/negative_loss": 0.4734005928039551, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.5799548625946045, - "train/total_loss": 0.3420846462249756 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.25785017013549805, - "train/contrastive_loss": 1.5223362445831299, - "train/negative_loss": 0.9469765424728394, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.5753597617149353, - "train/total_loss": 0.562317430973053 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.10839135199785233, - "train/contrastive_loss": 1.0327470302581787, - "train/negative_loss": 1.032745361328125, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.6391295503126457e-06, - "train/total_loss": 0.31494075059890747 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.11359640955924988, - "train/contrastive_loss": 0.6042802929878235, - "train/negative_loss": 0.46675872802734375, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.13752156496047974, - "train/total_loss": 0.23445247113704681 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.08429799973964691, - "train/contrastive_loss": 0.9004032015800476, - "train/negative_loss": 0.7683170437812805, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.1320861428976059, - "train/total_loss": 0.2643786370754242 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.1647275984287262, - "train/contrastive_loss": 1.0542041063308716, - "train/negative_loss": 0.11776397377252579, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.936440110206604, - "train/total_loss": 0.3755684196949005 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.1325555145740509, - "train/contrastive_loss": 2.068944215774536, - "train/negative_loss": 0.6023449897766113, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.4665992259979248, - "train/total_loss": 0.5463443994522095 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.16165950894355774, - "train/contrastive_loss": 0.38613298535346985, - "train/negative_loss": 0.37860965728759766, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.007523315958678722, - "train/total_loss": 0.23888611793518066 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.19301104545593262, - "train/contrastive_loss": 2.145570755004883, - "train/negative_loss": 0.85423743724823, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.2913331985473633, - "train/total_loss": 0.6221252083778381 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.24178367853164673, - "train/contrastive_loss": 2.9034204483032227, - "train/negative_loss": 2.2676076889038086, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.6358126401901245, - "train/total_loss": 0.8224678039550781 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.1830739676952362, - "train/contrastive_loss": 1.3913649320602417, - "train/negative_loss": 0.5251762866973877, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.866188645362854, - "train/total_loss": 0.46134695410728455 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.18298429250717163, - "train/contrastive_loss": 3.124505043029785, - "train/negative_loss": 2.0903475284576416, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.0341575145721436, - "train/total_loss": 0.8078852891921997 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.27472949028015137, - "train/contrastive_loss": 4.080432415008545, - "train/negative_loss": 1.6464099884033203, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 2.4340224266052246, - "train/total_loss": 1.0908160209655762 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.22943443059921265, - "train/contrastive_loss": 3.4157774448394775, - "train/negative_loss": 1.7785943746566772, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.6371830701828003, - "train/total_loss": 0.9125899076461792 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.20551109313964844, - "train/contrastive_loss": 3.842533588409424, - "train/negative_loss": 2.7224040031433105, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.1201294660568237, - "train/total_loss": 0.9740177989006042 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.26164236664772034, - "train/contrastive_loss": 4.160204887390137, - "train/negative_loss": 1.8117133378982544, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 2.3484914302825928, - "train/total_loss": 1.0936833620071411 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.26982381939888, - "train/contrastive_loss": 3.1407065391540527, - "train/negative_loss": 1.89778470993042, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.2429217100143433, - "train/total_loss": 0.8979651927947998 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.29960042238235474, - "train/contrastive_loss": 3.4313464164733887, - "train/negative_loss": 1.5429683923721313, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.8883781433105469, - "train/total_loss": 0.9858697056770325 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.13738934695720673, - "train/contrastive_loss": 0.5442332625389099, - "train/negative_loss": 0.5433416366577148, - "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.0008916151127777994, - "train/total_loss": 0.24623599648475647 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.163521409034729, - "train/contrastive_loss": 1.4566795825958252, - "train/negative_loss": 0.6876731514930725, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.7690064311027527, - "train/total_loss": 0.45485731959342957 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.10544067621231079, - "train/contrastive_loss": 1.290706753730774, - "train/negative_loss": 0.3771025240421295, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.913604199886322, - "train/total_loss": 0.363582044839859 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.18259546160697937, - "train/contrastive_loss": 1.5786157846450806, - "train/negative_loss": 1.5786157846450806, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.498318612575531 - }, - { - "epoch": 14.448669201520913, - "eval_exact_match_accuracy": 0.3504761904761905, - "eval_hamming_loss": 0.06386554621848739, - "eval_loss": 0.5876179337501526, - "eval_macro_f1": 0.42793034338810054, - "eval_macro_precision": 0.5814088584534831, - "eval_macro_recall": 0.3511485481754247, - "eval_micro_f1": 0.6085164835164835, - "eval_micro_precision": 0.7677642980935875, - "eval_micro_recall": 0.5039817974971559, - "eval_runtime": 2.6378, - "eval_samples_per_second": 199.031, - "eval_steps_per_second": 25.021, - "step": 3800 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.10698747634887695, - "train/contrastive_loss": 0.6779773235321045, - "train/negative_loss": 0.6776981949806213, - "train/num_negatives": 44, - "train/num_positives": 4, - "train/positive_loss": 0.00027911626966670156, - "train/total_loss": 0.24258294701576233 - }, - { - "epoch": 14.448669201520913, - "step": 3800, - "train/classification_loss": 0.09332019835710526, - "train/contrastive_loss": 0.5264272689819336, - "train/negative_loss": 0.5225359201431274, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.00389133021235466, - "train/total_loss": 0.19860565662384033 - }, - { - "epoch": 14.638783269961976, - "grad_norm": 4.863008975982666, - "learning_rate": 1.9429680365296806e-05, - "loss": 0.435, - "step": 3850 - }, - { - "epoch": 14.638783269961976, - "step": 3850, - "train/classification_loss": 0.09339234232902527, - "train/contrastive_loss": 0.4513559937477112, - "train/negative_loss": 0.44969916343688965, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.0016568414866924286, - "train/total_loss": 0.18366354703903198 - }, - { - "epoch": 14.638783269961976, - "step": 3850, - "train/classification_loss": 0.0771065354347229, - "train/contrastive_loss": 0.39081481099128723, - "train/negative_loss": 0.3742498755455017, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.016564946621656418, - "train/total_loss": 0.15526950359344482 - }, - { - "epoch": 14.828897338403042, - "grad_norm": 17.885530471801758, - "learning_rate": 1.94220700152207e-05, - "loss": 0.4378, - "step": 3900 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.394266813993454, - "train/contrastive_loss": 2.6207096576690674, - "train/negative_loss": 1.6182979345321655, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.0024117231369019, - "train/total_loss": 0.9184087514877319 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.1897570639848709, - "train/contrastive_loss": 2.029060125350952, - "train/negative_loss": 0.9938766360282898, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 1.0351834297180176, - "train/total_loss": 0.5955690741539001 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.17677249014377594, - "train/contrastive_loss": 1.1501284837722778, - "train/negative_loss": 0.31066983938217163, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.8394586443901062, - "train/total_loss": 0.40679818391799927 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.2678215503692627, - "train/contrastive_loss": 2.8522138595581055, - "train/negative_loss": 1.6054117679595947, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.2468022108078003, - "train/total_loss": 0.8382643461227417 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.09829790890216827, - "train/contrastive_loss": 1.3839068412780762, - "train/negative_loss": 0.9960927963256836, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.3878140151500702, - "train/total_loss": 0.37507927417755127 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.17423026263713837, - "train/contrastive_loss": 1.445080280303955, - "train/negative_loss": 1.2088016271591187, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.23627862334251404, - "train/total_loss": 0.46324634552001953 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.30008646845817566, - "train/contrastive_loss": 2.5774364471435547, - "train/negative_loss": 1.5744563341140747, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 1.0029799938201904, - "train/total_loss": 0.8155738115310669 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.15255676209926605, - "train/contrastive_loss": 2.0274674892425537, - "train/negative_loss": 1.6093159914016724, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.41815146803855896, - "train/total_loss": 0.558050274848938 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.1526375114917755, - "train/contrastive_loss": 1.1701189279556274, - "train/negative_loss": 1.0256824493408203, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.14443644881248474, - "train/total_loss": 0.3866612911224365 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.2811201214790344, - "train/contrastive_loss": 2.9274020195007324, - "train/negative_loss": 1.730527400970459, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.1968746185302734, - "train/total_loss": 0.866600513458252 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.16317002475261688, - "train/contrastive_loss": 2.300529718399048, - "train/negative_loss": 1.4821341037750244, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.8183955550193787, - "train/total_loss": 0.6232759952545166 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.11182282865047455, - "train/contrastive_loss": 1.752679467201233, - "train/negative_loss": 0.8125652074813843, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.9401142597198486, - "train/total_loss": 0.4623587131500244 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.1814967840909958, - "train/contrastive_loss": 3.1441032886505127, - "train/negative_loss": 1.5704139471054077, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.573689341545105, - "train/total_loss": 0.8103174567222595 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.08513619750738144, - "train/contrastive_loss": 1.411559820175171, - "train/negative_loss": 1.4115501642227173, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 9.700799637357704e-06, - "train/total_loss": 0.36744818091392517 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.08792739361524582, - "train/contrastive_loss": 0.9813827276229858, - "train/negative_loss": 0.9732238054275513, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.00815893430262804, - "train/total_loss": 0.2842039465904236 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.15712441504001617, - "train/contrastive_loss": 1.330417275428772, - "train/negative_loss": 0.6294429302215576, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.7009743452072144, - "train/total_loss": 0.4232078790664673 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.23208510875701904, - "train/contrastive_loss": 2.7436749935150146, - "train/negative_loss": 1.554756999015808, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.1889179944992065, - "train/total_loss": 0.7808201313018799 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.1849457323551178, - "train/contrastive_loss": 1.5054194927215576, - "train/negative_loss": 0.44826632738113403, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 1.0571532249450684, - "train/total_loss": 0.48602962493896484 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.2202039211988449, - "train/contrastive_loss": 1.3865563869476318, - "train/negative_loss": 0.9317866563796997, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.45476970076560974, - "train/total_loss": 0.4975152015686035 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.1420762985944748, - "train/contrastive_loss": 1.4330520629882812, - "train/negative_loss": 0.5621968507766724, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.8708551526069641, - "train/total_loss": 0.4286867380142212 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.1971278190612793, - "train/contrastive_loss": 1.5878738164901733, - "train/negative_loss": 0.21098336577415466, - "train/num_negatives": 44, - "train/num_positives": 10, - "train/positive_loss": 1.3768904209136963, - "train/total_loss": 0.514702558517456 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.261755108833313, - "train/contrastive_loss": 3.050969123840332, - "train/negative_loss": 1.374698281288147, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 1.6762707233428955, - "train/total_loss": 0.8719489574432373 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.14939266443252563, - "train/contrastive_loss": 1.9096521139144897, - "train/negative_loss": 0.4996696710586548, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 1.409982442855835, - "train/total_loss": 0.5313230752944946 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.17558440566062927, - "train/contrastive_loss": 1.9998366832733154, - "train/negative_loss": 0.6790288686752319, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 1.3208078145980835, - "train/total_loss": 0.5755517482757568 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.08311566710472107, - "train/contrastive_loss": 1.0017133951187134, - "train/negative_loss": 0.2408026158809662, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.7609107494354248, - "train/total_loss": 0.2834583520889282 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.29441380500793457, - "train/contrastive_loss": 1.9426779747009277, - "train/negative_loss": 0.5035298466682434, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.439148187637329, - "train/total_loss": 0.682949423789978 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.2529418468475342, - "train/contrastive_loss": 2.4353294372558594, - "train/negative_loss": 1.3680797815322876, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.0672495365142822, - "train/total_loss": 0.740007758140564 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.2177269011735916, - "train/contrastive_loss": 3.995924472808838, - "train/negative_loss": 2.8830678462982178, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 1.1128566265106201, - "train/total_loss": 1.0169118642807007 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.2335851937532425, - "train/contrastive_loss": 2.029794692993164, - "train/negative_loss": 0.8915490508079529, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 1.1382455825805664, - "train/total_loss": 0.6395441293716431 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.19482383131980896, - "train/contrastive_loss": 0.6574403047561646, - "train/negative_loss": 0.31776291131973267, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.3396773636341095, - "train/total_loss": 0.3263118863105774 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.11349548399448395, - "train/contrastive_loss": 1.1691443920135498, - "train/negative_loss": 0.2711946964263916, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.8979496359825134, - "train/total_loss": 0.3473243713378906 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.22807511687278748, - "train/contrastive_loss": 3.0166239738464355, - "train/negative_loss": 1.3877484798431396, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.628875494003296, - "train/total_loss": 0.8313999176025391 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.2782997786998749, - "train/contrastive_loss": 0.9439955353736877, - "train/negative_loss": 0.943882405757904, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.00011313601862639189, - "train/total_loss": 0.4670988917350769 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.16927890479564667, - "train/contrastive_loss": 0.6784379482269287, - "train/negative_loss": 0.5189102292060852, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.1595277190208435, - "train/total_loss": 0.3049665093421936 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.18913479149341583, - "train/contrastive_loss": 2.894742965698242, - "train/negative_loss": 2.384521484375, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.510221540927887, - "train/total_loss": 0.768083393573761 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.16906112432479858, - "train/contrastive_loss": 1.9948381185531616, - "train/negative_loss": 1.0575437545776367, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 0.9372943639755249, - "train/total_loss": 0.5680287480354309 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.1362282633781433, - "train/contrastive_loss": 1.843801498413086, - "train/negative_loss": 1.358138918876648, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.4856625199317932, - "train/total_loss": 0.5049885511398315 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.15526895225048065, - "train/contrastive_loss": 1.315871238708496, - "train/negative_loss": 1.0460760593414307, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.26979517936706543, - "train/total_loss": 0.4184432029724121 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.1844026893377304, - "train/contrastive_loss": 1.6059988737106323, - "train/negative_loss": 1.546562671661377, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.05943620204925537, - "train/total_loss": 0.5056024789810181 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.17908938229084015, - "train/contrastive_loss": 1.6576762199401855, - "train/negative_loss": 1.594594120979309, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.06308204680681229, - "train/total_loss": 0.5106246471405029 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.16896852850914001, - "train/contrastive_loss": 0.9785975813865662, - "train/negative_loss": 0.9470379948616028, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.03155956789851189, - "train/total_loss": 0.36468803882598877 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.19261521100997925, - "train/contrastive_loss": 2.3568642139434814, - "train/negative_loss": 1.5460195541381836, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.8108446598052979, - "train/total_loss": 0.6639880537986755 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.196249321103096, - "train/contrastive_loss": 1.9670652151107788, - "train/negative_loss": 0.42847633361816406, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 1.5385888814926147, - "train/total_loss": 0.5896623730659485 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.1542297750711441, - "train/contrastive_loss": 2.435218334197998, - "train/negative_loss": 1.5135787725448608, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.921639621257782, - "train/total_loss": 0.6412734389305115 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.17397333681583405, - "train/contrastive_loss": 1.1902811527252197, - "train/negative_loss": 0.39526987075805664, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.7950112223625183, - "train/total_loss": 0.41202956438064575 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.24566319584846497, - "train/contrastive_loss": 1.597927451133728, - "train/negative_loss": 0.7173250913619995, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.8806023597717285, - "train/total_loss": 0.5652487277984619 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.1028580367565155, - "train/contrastive_loss": 0.855050802230835, - "train/negative_loss": 0.8550111055374146, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 3.969823592342436e-05, - "train/total_loss": 0.273868203163147 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.13580796122550964, - "train/contrastive_loss": 1.5875253677368164, - "train/negative_loss": 0.5982151031494141, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.9893102645874023, - "train/total_loss": 0.45331305265426636 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.0983162522315979, - "train/contrastive_loss": 1.2443861961364746, - "train/negative_loss": 1.05070960521698, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.19367654621601105, - "train/total_loss": 0.34719347953796387 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.16068191826343536, - "train/contrastive_loss": 1.3775705099105835, - "train/negative_loss": 0.5374722480773926, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.8400982618331909, - "train/total_loss": 0.4361960291862488 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.11592218279838562, - "train/contrastive_loss": 1.7635583877563477, - "train/negative_loss": 0.5463334321975708, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.2172249555587769, - "train/total_loss": 0.46863386034965515 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.1724414825439453, - "train/contrastive_loss": 0.6267135143280029, - "train/negative_loss": 0.5144782662391663, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.11223524808883667, - "train/total_loss": 0.2977842092514038 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.1938094198703766, - "train/contrastive_loss": 3.306283950805664, - "train/negative_loss": 1.1695865392684937, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 2.136697292327881, - "train/total_loss": 0.855066180229187 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.2053905427455902, - "train/contrastive_loss": 1.6975270509719849, - "train/negative_loss": 0.812495768070221, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.8850312829017639, - "train/total_loss": 0.5448959469795227 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.19586370885372162, - "train/contrastive_loss": 1.6630618572235107, - "train/negative_loss": 0.41531142592430115, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 1.2477504014968872, - "train/total_loss": 0.5284760594367981 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.16826051473617554, - "train/contrastive_loss": 2.9900503158569336, - "train/negative_loss": 1.8261727094650269, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.1638774871826172, - "train/total_loss": 0.7662705779075623 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.2725692093372345, - "train/contrastive_loss": 3.968104839324951, - "train/negative_loss": 1.4416202306747437, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 2.526484489440918, - "train/total_loss": 1.066190242767334 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.24045336246490479, - "train/contrastive_loss": 4.026223182678223, - "train/negative_loss": 1.9213581085205078, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 2.104865074157715, - "train/total_loss": 1.0456979274749756 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.1621697098016739, - "train/contrastive_loss": 2.578885793685913, - "train/negative_loss": 1.892559289932251, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.6863265037536621, - "train/total_loss": 0.6779468655586243 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.24779574573040009, - "train/contrastive_loss": 4.381435871124268, - "train/negative_loss": 1.7022870779037476, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 2.6791489124298096, - "train/total_loss": 1.1240829229354858 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.29708367586135864, - "train/contrastive_loss": 3.374786853790283, - "train/negative_loss": 1.9625520706176758, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.412234902381897, - "train/total_loss": 0.9720410704612732 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.29975366592407227, - "train/contrastive_loss": 3.1363792419433594, - "train/negative_loss": 1.484134554862976, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.6522445678710938, - "train/total_loss": 0.927029550075531 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.14046238362789154, - "train/contrastive_loss": 0.6531795263290405, - "train/negative_loss": 0.6530122756958008, - "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.00016727847105357796, - "train/total_loss": 0.2710982859134674 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.166677787899971, - "train/contrastive_loss": 1.529881477355957, - "train/negative_loss": 0.7055662274360657, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.8243153095245361, - "train/total_loss": 0.4726541042327881 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.11187603324651718, - "train/contrastive_loss": 1.1815879344940186, - "train/negative_loss": 0.33619600534439087, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.8453918695449829, - "train/total_loss": 0.34819361567497253 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.1977161169052124, - "train/contrastive_loss": 1.9805055856704712, - "train/negative_loss": 1.9805055856704712, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5938172340393066 - }, - { - "epoch": 14.828897338403042, - "eval_exact_match_accuracy": 0.32761904761904764, - "eval_hamming_loss": 0.06610644257703081, - "eval_loss": 0.5833454728126526, - "eval_macro_f1": 0.4129100225419429, - "eval_macro_precision": 0.5747398896364787, - "eval_macro_recall": 0.33451412243369216, - "eval_micro_f1": 0.5874125874125874, - "eval_micro_precision": 0.7622504537205081, - "eval_micro_recall": 0.4778156996587031, - "eval_runtime": 2.6414, - "eval_samples_per_second": 198.757, - "eval_steps_per_second": 24.987, - "step": 3900 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.10299953073263168, - "train/contrastive_loss": 0.5087851881980896, - "train/negative_loss": 0.3286198079586029, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.1801653951406479, - "train/total_loss": 0.20475657284259796 - }, - { - "epoch": 14.828897338403042, - "step": 3900, - "train/classification_loss": 0.11027241498231888, - "train/contrastive_loss": 0.23736700415611267, - "train/negative_loss": 0.23690275847911835, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.0004642516141757369, - "train/total_loss": 0.15774580836296082 - }, - { - "epoch": 15.019011406844106, - "grad_norm": 4.70112419128418, - "learning_rate": 1.94144596651446e-05, - "loss": 0.4853, - "step": 3950 - }, - { - "epoch": 15.019011406844106, - "step": 3950, - "train/classification_loss": 0.09927143901586533, - "train/contrastive_loss": 0.3796497881412506, - "train/negative_loss": 0.34694865345954895, - "train/num_negatives": 40, - "train/num_positives": 12, - "train/positive_loss": 0.03270113095641136, - "train/total_loss": 0.1752014011144638 - }, - { - "epoch": 15.019011406844106, - "step": 3950, - "train/classification_loss": 0.11699184030294418, - "train/contrastive_loss": 1.1100807189941406, - "train/negative_loss": 1.1100637912750244, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.692787918727845e-05, - "train/total_loss": 0.3390079736709595 - }, - { - "epoch": 15.209125475285171, - "grad_norm": 8.164756774902344, - "learning_rate": 1.9406849315068493e-05, - "loss": 0.4541, - "step": 4000 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.31831061840057373, - "train/contrastive_loss": 1.8275189399719238, - "train/negative_loss": 0.5465643405914307, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.2809545993804932, - "train/total_loss": 0.6838144063949585 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.13335134088993073, - "train/contrastive_loss": 1.5934499502182007, - "train/negative_loss": 1.2008392810821533, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.392610639333725, - "train/total_loss": 0.4520413279533386 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.16266579926013947, - "train/contrastive_loss": 0.5755535364151001, - "train/negative_loss": 0.13597719371318817, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.43957632780075073, - "train/total_loss": 0.2777765095233917 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.2366701066493988, - "train/contrastive_loss": 3.0598762035369873, - "train/negative_loss": 2.1107096672058105, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.9491665363311768, - "train/total_loss": 0.8486453294754028 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.09049591422080994, - "train/contrastive_loss": 2.0517184734344482, - "train/negative_loss": 1.8461123704910278, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.20560602843761444, - "train/total_loss": 0.5008395910263062 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.16123728454113007, - "train/contrastive_loss": 1.870987057685852, - "train/negative_loss": 1.4527429342269897, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.4182441532611847, - "train/total_loss": 0.5354347229003906 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.22481949627399445, - "train/contrastive_loss": 2.932222843170166, - "train/negative_loss": 2.0993454456329346, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.832877516746521, - "train/total_loss": 0.8112640380859375 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.14473530650138855, - "train/contrastive_loss": 1.6290743350982666, - "train/negative_loss": 1.2610183954238892, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.36805596947669983, - "train/total_loss": 0.47055017948150635 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.1404017210006714, - "train/contrastive_loss": 1.0525003671646118, - "train/negative_loss": 1.042894721031189, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.009605659171938896, - "train/total_loss": 0.3509017825126648 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.36655712127685547, - "train/contrastive_loss": 2.794285297393799, - "train/negative_loss": 1.383866786956787, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.4104186296463013, - "train/total_loss": 0.9254142045974731 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.1779036670923233, - "train/contrastive_loss": 2.2664239406585693, - "train/negative_loss": 1.608270287513733, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.6581536531448364, - "train/total_loss": 0.6311884522438049 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.09741813689470291, - "train/contrastive_loss": 0.8767304420471191, - "train/negative_loss": 0.2354012429714203, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.6413291692733765, - "train/total_loss": 0.2727642357349396 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.16655026376247406, - "train/contrastive_loss": 1.9470635652542114, - "train/negative_loss": 1.7739654779434204, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.17309807240962982, - "train/total_loss": 0.5559629797935486 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.07385476678609848, - "train/contrastive_loss": 1.5081878900527954, - "train/negative_loss": 1.508181095123291, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 6.809883416281082e-06, - "train/total_loss": 0.3754923641681671 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.09319930523633957, - "train/contrastive_loss": 1.4435793161392212, - "train/negative_loss": 1.4434871673583984, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 9.2112306447234e-05, - "train/total_loss": 0.3819151818752289 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.16001160442829132, - "train/contrastive_loss": 1.0968210697174072, - "train/negative_loss": 0.5457438826560974, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.5510771870613098, - "train/total_loss": 0.3793758153915405 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.23007063567638397, - "train/contrastive_loss": 2.0981826782226562, - "train/negative_loss": 1.0236819982528687, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.074500560760498, - "train/total_loss": 0.6497071981430054 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.1730884611606598, - "train/contrastive_loss": 0.9470776915550232, - "train/negative_loss": 0.2766163945198059, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.6704612970352173, - "train/total_loss": 0.3625040054321289 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.16473345458507538, - "train/contrastive_loss": 1.1057584285736084, - "train/negative_loss": 0.6207022070884705, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.48505622148513794, - "train/total_loss": 0.3858851492404938 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.13508440554141998, - "train/contrastive_loss": 1.3749454021453857, - "train/negative_loss": 0.8764373660087585, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.4985080361366272, - "train/total_loss": 0.41007351875305176 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.21221117675304413, - "train/contrastive_loss": 1.546924352645874, - "train/negative_loss": 0.24166329205036163, - "train/num_negatives": 44, - "train/num_positives": 10, - "train/positive_loss": 1.3052610158920288, - "train/total_loss": 0.5215960741043091 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.21989329159259796, - "train/contrastive_loss": 1.8462920188903809, - "train/negative_loss": 1.3062174320220947, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 0.5400746464729309, - "train/total_loss": 0.5891516804695129 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.12188639491796494, - "train/contrastive_loss": 0.8784916400909424, - "train/negative_loss": 0.3427370488643646, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.5357545614242554, - "train/total_loss": 0.2975847125053406 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.1490432769060135, - "train/contrastive_loss": 1.0939316749572754, - "train/negative_loss": 0.535412073135376, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.5585196614265442, - "train/total_loss": 0.3678296208381653 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.085634745657444, - "train/contrastive_loss": 1.2096298933029175, - "train/negative_loss": 0.3494751751422882, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.8601547479629517, - "train/total_loss": 0.3275607228279114 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.2925473749637604, - "train/contrastive_loss": 1.6645604372024536, - "train/negative_loss": 0.5261334180831909, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.1384270191192627, - "train/total_loss": 0.6254594326019287 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.2984907925128937, - "train/contrastive_loss": 2.930392265319824, - "train/negative_loss": 1.572022795677185, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.3583693504333496, - "train/total_loss": 0.8845692873001099 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.16958162188529968, - "train/contrastive_loss": 3.5781164169311523, - "train/negative_loss": 2.510838270187378, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 1.067278265953064, - "train/total_loss": 0.8852049112319946 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.19607992470264435, - "train/contrastive_loss": 1.0964759588241577, - "train/negative_loss": 0.7994586825370789, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.29701724648475647, - "train/total_loss": 0.41537511348724365 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.21995891630649567, - "train/contrastive_loss": 0.9817628860473633, - "train/negative_loss": 0.7990974187850952, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.18266548216342926, - "train/total_loss": 0.41631150245666504 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.09785909205675125, - "train/contrastive_loss": 0.901837944984436, - "train/negative_loss": 0.6756097674369812, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.22622820734977722, - "train/total_loss": 0.27822667360305786 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.20741568505764008, - "train/contrastive_loss": 2.7758612632751465, - "train/negative_loss": 1.635964274406433, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.1398969888687134, - "train/total_loss": 0.7625879645347595 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.19241014122962952, - "train/contrastive_loss": 0.536547064781189, - "train/negative_loss": 0.5364866256713867, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 6.0440936067607254e-05, - "train/total_loss": 0.29971957206726074 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.1621273010969162, - "train/contrastive_loss": 0.897975742816925, - "train/negative_loss": 0.7912145853042603, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.1067611426115036, - "train/total_loss": 0.3417224586009979 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.22004684805870056, - "train/contrastive_loss": 3.7179555892944336, - "train/negative_loss": 2.7791237831115723, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.9388318657875061, - "train/total_loss": 0.9636379480361938 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.17330750823020935, - "train/contrastive_loss": 2.421257734298706, - "train/negative_loss": 1.3040580749511719, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.1171996593475342, - "train/total_loss": 0.6575590372085571 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.1054597944021225, - "train/contrastive_loss": 0.7655807733535767, - "train/negative_loss": 0.621974766254425, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.14360599219799042, - "train/total_loss": 0.2585759460926056 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.12962166965007782, - "train/contrastive_loss": 0.9480772614479065, - "train/negative_loss": 0.9128456711769104, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.03523160517215729, - "train/total_loss": 0.3192371129989624 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.1728668361902237, - "train/contrastive_loss": 1.5216861963272095, - "train/negative_loss": 1.5097633600234985, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.011922825127840042, - "train/total_loss": 0.4772040843963623 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.20010799169540405, - "train/contrastive_loss": 2.8767614364624023, - "train/negative_loss": 2.4863779544830322, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.3903835117816925, - "train/total_loss": 0.7754603028297424 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.15349648892879486, - "train/contrastive_loss": 1.39593505859375, - "train/negative_loss": 0.8526375889778137, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.5432974100112915, - "train/total_loss": 0.432683527469635 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.15187996625900269, - "train/contrastive_loss": 2.220020055770874, - "train/negative_loss": 1.8805991411209106, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.33942094445228577, - "train/total_loss": 0.5958839654922485 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.18421272933483124, - "train/contrastive_loss": 1.1461260318756104, - "train/negative_loss": 0.33583664894104004, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 0.8102893829345703, - "train/total_loss": 0.41343793272972107 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.16465787589550018, - "train/contrastive_loss": 2.6446895599365234, - "train/negative_loss": 1.4790427684783936, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.1656467914581299, - "train/total_loss": 0.693595826625824 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.12112986296415329, - "train/contrastive_loss": 1.0477752685546875, - "train/negative_loss": 0.5989039540290833, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.44887128472328186, - "train/total_loss": 0.33068493008613586 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.27668771147727966, - "train/contrastive_loss": 1.486797571182251, - "train/negative_loss": 0.628089189529419, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.858708381652832, - "train/total_loss": 0.5740472078323364 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.11773277819156647, - "train/contrastive_loss": 0.9411860108375549, - "train/negative_loss": 0.9411842226982117, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.7583390672371024e-06, - "train/total_loss": 0.3059699833393097 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.10701647400856018, - "train/contrastive_loss": 0.46986544132232666, - "train/negative_loss": 0.22990040481090546, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.2399650514125824, - "train/total_loss": 0.20098957419395447 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.09836211055517197, - "train/contrastive_loss": 1.2475292682647705, - "train/negative_loss": 1.225046992301941, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.02248232811689377, - "train/total_loss": 0.3478679656982422 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.17283697426319122, - "train/contrastive_loss": 2.023157835006714, - "train/negative_loss": 1.7550384998321533, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.26811930537223816, - "train/total_loss": 0.5774685740470886 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.12034578621387482, - "train/contrastive_loss": 1.5970724821090698, - "train/negative_loss": 0.6533419489860535, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.9437305331230164, - "train/total_loss": 0.4397602677345276 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.148742213845253, - "train/contrastive_loss": 0.30038902163505554, - "train/negative_loss": 0.2943606972694397, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.006028316915035248, - "train/total_loss": 0.20882001519203186 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.18175338208675385, - "train/contrastive_loss": 1.7332215309143066, - "train/negative_loss": 1.0083814859390259, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.7248400449752808, - "train/total_loss": 0.5283976793289185 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.21441631019115448, - "train/contrastive_loss": 1.4899265766143799, - "train/negative_loss": 1.0607644319534302, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.42916208505630493, - "train/total_loss": 0.5124016404151917 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.12293386459350586, - "train/contrastive_loss": 0.2791917026042938, - "train/negative_loss": 0.18882489204406738, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.09036680310964584, - "train/total_loss": 0.1787722110748291 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.18471963703632355, - "train/contrastive_loss": 2.7449405193328857, - "train/negative_loss": 1.9758869409561157, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.76905357837677, - "train/total_loss": 0.7337077260017395 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.28619709610939026, - "train/contrastive_loss": 3.5339159965515137, - "train/negative_loss": 1.6381322145462036, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.89578378200531, - "train/total_loss": 0.9929803609848022 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.2411699891090393, - "train/contrastive_loss": 3.618514060974121, - "train/negative_loss": 1.8727037906646729, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.7458103895187378, - "train/total_loss": 0.9648728370666504 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.13980531692504883, - "train/contrastive_loss": 1.638691782951355, - "train/negative_loss": 1.5997514724731445, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.038940317928791046, - "train/total_loss": 0.46754369139671326 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.2492377609014511, - "train/contrastive_loss": 4.221097946166992, - "train/negative_loss": 1.7969151735305786, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 2.424182891845703, - "train/total_loss": 1.0934573411941528 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.26087453961372375, - "train/contrastive_loss": 4.5903000831604, - "train/negative_loss": 3.7146172523498535, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.8756827116012573, - "train/total_loss": 1.1789345741271973 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.29934144020080566, - "train/contrastive_loss": 3.3080620765686035, - "train/negative_loss": 1.866834282875061, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.4412277936935425, - "train/total_loss": 0.9609538912773132 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.13907906413078308, - "train/contrastive_loss": 0.7659385800361633, - "train/negative_loss": 0.7608644366264343, - "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.005074169486761093, - "train/total_loss": 0.2922667860984802 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.14159752428531647, - "train/contrastive_loss": 1.0898241996765137, - "train/negative_loss": 0.4403412640094757, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.6494829654693604, - "train/total_loss": 0.35956236720085144 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.10488314926624298, - "train/contrastive_loss": 1.0389996767044067, - "train/negative_loss": 0.5078248381614685, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.5311748385429382, - "train/total_loss": 0.31268310546875 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.18270820379257202, - "train/contrastive_loss": 1.5003291368484497, - "train/negative_loss": 1.5003291368484497, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.4827740490436554 - }, - { - "epoch": 15.209125475285171, - "eval_exact_match_accuracy": 0.3580952380952381, - "eval_hamming_loss": 0.06274509803921569, - "eval_loss": 0.5291520357131958, - "eval_macro_f1": 0.44319492345134515, - "eval_macro_precision": 0.5827890201340296, - "eval_macro_recall": 0.37270872473801914, - "eval_micro_f1": 0.6281540504648074, - "eval_micro_precision": 0.7543859649122807, - "eval_micro_recall": 0.5381114903299203, - "eval_runtime": 2.625, - "eval_samples_per_second": 200.002, - "eval_steps_per_second": 25.143, - "step": 4000 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.052484918385744095, - "train/contrastive_loss": 0.3793196678161621, - "train/negative_loss": 0.3683813810348511, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.010938283056020737, - "train/total_loss": 0.12834885716438293 - }, - { - "epoch": 15.209125475285171, - "step": 4000, - "train/classification_loss": 0.07262670993804932, - "train/contrastive_loss": 0.36192047595977783, - "train/negative_loss": 0.23034629225730896, - "train/num_negatives": 44, - "train/num_positives": 10, - "train/positive_loss": 0.13157419860363007, - "train/total_loss": 0.1450107991695404 - }, - { - "epoch": 15.399239543726235, - "grad_norm": 9.501413345336914, - "learning_rate": 1.939923896499239e-05, - "loss": 0.4292, - "step": 4050 - }, - { - "epoch": 15.399239543726235, - "step": 4050, - "train/classification_loss": 0.10132987052202225, - "train/contrastive_loss": 0.24914270639419556, - "train/negative_loss": 0.24905771017074585, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 8.499122486682609e-05, - "train/total_loss": 0.151158407330513 - }, - { - "epoch": 15.399239543726235, - "step": 4050, - "train/classification_loss": 0.17752884328365326, - "train/contrastive_loss": 0.9157673120498657, - "train/negative_loss": 0.4796258509159088, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.4361414611339569, - "train/total_loss": 0.36068230867385864 - }, - { - "epoch": 15.5893536121673, - "grad_norm": 3.8831286430358887, - "learning_rate": 1.939178082191781e-05, - "loss": 0.423, - "step": 4100 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.34076157212257385, - "train/contrastive_loss": 2.035186767578125, - "train/negative_loss": 0.42538508772850037, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.6098017692565918, - "train/total_loss": 0.7477989196777344 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.13123323023319244, - "train/contrastive_loss": 1.6573704481124878, - "train/negative_loss": 1.2360913753509521, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.42127910256385803, - "train/total_loss": 0.4627073407173157 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.15777191519737244, - "train/contrastive_loss": 0.9119049310684204, - "train/negative_loss": 0.16825896501541138, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.743645966053009, - "train/total_loss": 0.34015291929244995 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.24343878030776978, - "train/contrastive_loss": 4.204609394073486, - "train/negative_loss": 3.150953531265259, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.0536558628082275, - "train/total_loss": 1.0843605995178223 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.08485651016235352, - "train/contrastive_loss": 1.9600156545639038, - "train/negative_loss": 1.769433617591858, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.19058199226856232, - "train/total_loss": 0.4768596589565277 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.1581645905971527, - "train/contrastive_loss": 1.5791651010513306, - "train/negative_loss": 1.0905532836914062, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.48861178755760193, - "train/total_loss": 0.4739976227283478 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.22507594525814056, - "train/contrastive_loss": 2.7628142833709717, - "train/negative_loss": 1.7965131998062134, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.9663011431694031, - "train/total_loss": 0.777638852596283 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.12396249920129776, - "train/contrastive_loss": 1.8084228038787842, - "train/negative_loss": 1.28127920627594, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.5271435976028442, - "train/total_loss": 0.485647052526474 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.1403028815984726, - "train/contrastive_loss": 1.3483251333236694, - "train/negative_loss": 1.332473635673523, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.01585150510072708, - "train/total_loss": 0.40996789932250977 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.2996567487716675, - "train/contrastive_loss": 2.625196695327759, - "train/negative_loss": 1.4283382892608643, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.1968584060668945, - "train/total_loss": 0.8246961236000061 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.16081120073795319, - "train/contrastive_loss": 2.0177457332611084, - "train/negative_loss": 1.6912635564804077, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.3264821469783783, - "train/total_loss": 0.5643603801727295 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.10472220927476883, - "train/contrastive_loss": 1.219502329826355, - "train/negative_loss": 0.3059333860874176, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.913568913936615, - "train/total_loss": 0.3486226797103882 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.15734955668449402, - "train/contrastive_loss": 1.702951431274414, - "train/negative_loss": 1.5832023620605469, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.11974909156560898, - "train/total_loss": 0.4979398548603058 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.08943256735801697, - "train/contrastive_loss": 2.6881062984466553, - "train/negative_loss": 2.685537576675415, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.0025687413290143013, - "train/total_loss": 0.6270538568496704 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.09695737808942795, - "train/contrastive_loss": 1.5052509307861328, - "train/negative_loss": 0.7637326121330261, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.7415183186531067, - "train/total_loss": 0.3980075716972351 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.11806848645210266, - "train/contrastive_loss": 0.5351139903068542, - "train/negative_loss": 0.5045150518417358, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.030598938465118408, - "train/total_loss": 0.22509127855300903 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.21546192467212677, - "train/contrastive_loss": 1.4631508588790894, - "train/negative_loss": 0.8686181902885437, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.5945326685905457, - "train/total_loss": 0.5080921053886414 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.163499116897583, - "train/contrastive_loss": 0.7278239130973816, - "train/negative_loss": 0.2997356653213501, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.4280882477760315, - "train/total_loss": 0.3090639114379883 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.19600144028663635, - "train/contrastive_loss": 2.280444622039795, - "train/negative_loss": 1.3032047748565674, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.977239727973938, - "train/total_loss": 0.6520903706550598 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.12281271815299988, - "train/contrastive_loss": 1.5790340900421143, - "train/negative_loss": 0.38444480299949646, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.1945892572402954, - "train/total_loss": 0.43861955404281616 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.18955294787883759, - "train/contrastive_loss": 0.887004017829895, - "train/negative_loss": 0.2006487101316452, - "train/num_negatives": 44, - "train/num_positives": 10, - "train/positive_loss": 0.6863552927970886, - "train/total_loss": 0.3669537603855133 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.2319905161857605, - "train/contrastive_loss": 1.5380680561065674, - "train/negative_loss": 1.165163278579712, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 0.37290483713150024, - "train/total_loss": 0.539604127407074 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.12262660264968872, - "train/contrastive_loss": 0.8656572699546814, - "train/negative_loss": 0.2794332504272461, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.5862240195274353, - "train/total_loss": 0.29575806856155396 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.1398412138223648, - "train/contrastive_loss": 1.2208163738250732, - "train/negative_loss": 0.4643104672431946, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.7565059661865234, - "train/total_loss": 0.38400447368621826 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.0766678974032402, - "train/contrastive_loss": 0.705133318901062, - "train/negative_loss": 0.23477311432361603, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.4703602194786072, - "train/total_loss": 0.21769455075263977 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.28178805112838745, - "train/contrastive_loss": 2.2222418785095215, - "train/negative_loss": 0.6060993075370789, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.6161425113677979, - "train/total_loss": 0.7262364625930786 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.28985998034477234, - "train/contrastive_loss": 2.758349657058716, - "train/negative_loss": 1.3769497871398926, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.3813998699188232, - "train/total_loss": 0.8415299654006958 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.17861206829547882, - "train/contrastive_loss": 3.712977647781372, - "train/negative_loss": 2.770890712738037, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.942086935043335, - "train/total_loss": 0.92120760679245 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.17899057269096375, - "train/contrastive_loss": 1.525565266609192, - "train/negative_loss": 0.6474210023880005, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.8781442642211914, - "train/total_loss": 0.48410362005233765 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.20677293837070465, - "train/contrastive_loss": 0.8936482667922974, - "train/negative_loss": 0.5181020498275757, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.3755462169647217, - "train/total_loss": 0.38550257682800293 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.1091718077659607, - "train/contrastive_loss": 1.4851458072662354, - "train/negative_loss": 0.5882835388183594, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.896862268447876, - "train/total_loss": 0.40620097517967224 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.20171897113323212, - "train/contrastive_loss": 2.6505088806152344, - "train/negative_loss": 1.3575785160064697, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.2929303646087646, - "train/total_loss": 0.7318207621574402 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.19383573532104492, - "train/contrastive_loss": 0.5299912691116333, - "train/negative_loss": 0.5292276740074158, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0007635885267518461, - "train/total_loss": 0.2998339831829071 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.18022450804710388, - "train/contrastive_loss": 1.1833536624908447, - "train/negative_loss": 0.5121380090713501, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.6712157130241394, - "train/total_loss": 0.4168952405452728 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.2297990471124649, - "train/contrastive_loss": 4.2775163650512695, - "train/negative_loss": 2.895548105239868, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.3819684982299805, - "train/total_loss": 1.0853023529052734 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.19537891447544098, - "train/contrastive_loss": 3.6429100036621094, - "train/negative_loss": 2.0491247177124023, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.5937851667404175, - "train/total_loss": 0.9239609241485596 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.10518279671669006, - "train/contrastive_loss": 0.2784043550491333, - "train/negative_loss": 0.19037498533725739, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.08802936226129532, - "train/total_loss": 0.16086366772651672 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.154654398560524, - "train/contrastive_loss": 0.9095209836959839, - "train/negative_loss": 0.889610767364502, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.019910242408514023, - "train/total_loss": 0.33655858039855957 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.18328402936458588, - "train/contrastive_loss": 1.8156219720840454, - "train/negative_loss": 1.7003884315490723, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.11523357033729553, - "train/total_loss": 0.5464084148406982 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.19871588051319122, - "train/contrastive_loss": 2.353888988494873, - "train/negative_loss": 2.255964517593384, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.09792443364858627, - "train/total_loss": 0.6694936752319336 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.17807379364967346, - "train/contrastive_loss": 2.014467477798462, - "train/negative_loss": 1.4164310693740845, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.5980363488197327, - "train/total_loss": 0.5809673070907593 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.16239649057388306, - "train/contrastive_loss": 2.5983662605285645, - "train/negative_loss": 1.8397549390792847, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.758611261844635, - "train/total_loss": 0.6820697784423828 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.1939525306224823, - "train/contrastive_loss": 1.7354676723480225, - "train/negative_loss": 0.5247897505760193, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 1.210677981376648, - "train/total_loss": 0.5410460829734802 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.17871801555156708, - "train/contrastive_loss": 3.259268045425415, - "train/negative_loss": 1.344139575958252, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.915128469467163, - "train/total_loss": 0.8305716514587402 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.1298266351222992, - "train/contrastive_loss": 0.6541414260864258, - "train/negative_loss": 0.2652236819267273, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.3889177441596985, - "train/total_loss": 0.26065492630004883 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.2771438658237457, - "train/contrastive_loss": 1.52113938331604, - "train/negative_loss": 0.7476596236228943, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.7734798192977905, - "train/total_loss": 0.5813717842102051 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.10849671065807343, - "train/contrastive_loss": 1.002732753753662, - "train/negative_loss": 1.0027318000793457, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 9.238724487659056e-07, - "train/total_loss": 0.3090432584285736 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.11843731999397278, - "train/contrastive_loss": 0.8353102207183838, - "train/negative_loss": 0.18875548243522644, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.6465547680854797, - "train/total_loss": 0.28549936413764954 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.11189188808202744, - "train/contrastive_loss": 1.7843576669692993, - "train/negative_loss": 1.353553056716919, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.430804580450058, - "train/total_loss": 0.46876344084739685 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.16889089345932007, - "train/contrastive_loss": 2.6725571155548096, - "train/negative_loss": 2.3909754753112793, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.2815815508365631, - "train/total_loss": 0.7034023404121399 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.12248165160417557, - "train/contrastive_loss": 1.767439603805542, - "train/negative_loss": 0.35389459133148193, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.41354501247406, - "train/total_loss": 0.4759695827960968 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.16037432849407196, - "train/contrastive_loss": 0.32347914576530457, - "train/negative_loss": 0.30229324102401733, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.02118591219186783, - "train/total_loss": 0.22507014870643616 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.16544586420059204, - "train/contrastive_loss": 1.233327865600586, - "train/negative_loss": 0.6125301122665405, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.6207978129386902, - "train/total_loss": 0.41211146116256714 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.2080453485250473, - "train/contrastive_loss": 2.872901678085327, - "train/negative_loss": 2.461361885070801, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.41153988242149353, - "train/total_loss": 0.7826257348060608 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.16247789561748505, - "train/contrastive_loss": 0.6756911277770996, - "train/negative_loss": 0.26833662390708923, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.4073545038700104, - "train/total_loss": 0.2976161241531372 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.18817932903766632, - "train/contrastive_loss": 2.812286376953125, - "train/negative_loss": 2.162795066833496, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.6494911909103394, - "train/total_loss": 0.7506365776062012 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.27096232771873474, - "train/contrastive_loss": 3.4288604259490967, - "train/negative_loss": 1.6826035976409912, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.7462568283081055, - "train/total_loss": 0.9567344188690186 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.22645337879657745, - "train/contrastive_loss": 2.6377315521240234, - "train/negative_loss": 1.833013892173767, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.8047177195549011, - "train/total_loss": 0.7539997100830078 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.15168236196041107, - "train/contrastive_loss": 2.799431800842285, - "train/negative_loss": 2.7075164318084717, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.09191534668207169, - "train/total_loss": 0.7115687727928162 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.2378636598587036, - "train/contrastive_loss": 3.8400588035583496, - "train/negative_loss": 1.843161940574646, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.996896743774414, - "train/total_loss": 1.0058753490447998 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.2764231264591217, - "train/contrastive_loss": 5.267734050750732, - "train/negative_loss": 3.9424314498901367, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.3253024816513062, - "train/total_loss": 1.329969882965088 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.3202246427536011, - "train/contrastive_loss": 3.2392160892486572, - "train/negative_loss": 2.0570974349975586, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.1821186542510986, - "train/total_loss": 0.9680678844451904 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.1308726966381073, - "train/contrastive_loss": 0.6919634342193604, - "train/negative_loss": 0.6916763186454773, - "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.0002871381875593215, - "train/total_loss": 0.26926538348197937 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.13871154189109802, - "train/contrastive_loss": 1.2202831506729126, - "train/negative_loss": 0.17946861684322357, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 1.0408145189285278, - "train/total_loss": 0.3827681541442871 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.08856913447380066, - "train/contrastive_loss": 0.5836161375045776, - "train/negative_loss": 0.4512704908847809, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.13234567642211914, - "train/total_loss": 0.20529237389564514 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.1792525202035904, - "train/contrastive_loss": 1.4160962104797363, - "train/negative_loss": 1.4160962104797363, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.46247178316116333 - }, - { - "epoch": 15.5893536121673, - "eval_exact_match_accuracy": 0.35619047619047617, - "eval_hamming_loss": 0.06240896358543417, - "eval_loss": 0.555469810962677, - "eval_macro_f1": 0.43829743374261526, - "eval_macro_precision": 0.5856181397078473, - "eval_macro_recall": 0.36471552593279477, - "eval_micro_f1": 0.6249158249158249, - "eval_micro_precision": 0.7656765676567657, - "eval_micro_recall": 0.5278725824800911, - "eval_runtime": 2.6285, - "eval_samples_per_second": 199.731, - "eval_steps_per_second": 25.109, - "step": 4100 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.11456893384456635, - "train/contrastive_loss": 0.4320535361766815, - "train/negative_loss": 0.4320389926433563, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 1.4543638826580718e-05, - "train/total_loss": 0.20097965002059937 - }, - { - "epoch": 15.5893536121673, - "step": 4100, - "train/classification_loss": 0.06852655112743378, - "train/contrastive_loss": 0.26524150371551514, - "train/negative_loss": 0.2359706610441208, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.029270857572555542, - "train/total_loss": 0.12157484889030457 - }, - { - "epoch": 15.779467680608365, - "grad_norm": 3.0254623889923096, - "learning_rate": 1.9384170471841707e-05, - "loss": 0.4506, - "step": 4150 - }, - { - "epoch": 15.779467680608365, - "step": 4150, - "train/classification_loss": 0.05558672919869423, - "train/contrastive_loss": 0.3125383257865906, - "train/negative_loss": 0.2911210060119629, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.02141733467578888, - "train/total_loss": 0.11809439957141876 - }, - { - "epoch": 15.779467680608365, - "step": 4150, - "train/classification_loss": 0.0684405043721199, - "train/contrastive_loss": 0.332396537065506, - "train/negative_loss": 0.31319501996040344, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.019201528280973434, - "train/total_loss": 0.13491982221603394 - }, - { - "epoch": 15.96958174904943, - "grad_norm": 6.299551963806152, - "learning_rate": 1.93765601217656e-05, - "loss": 0.4367, - "step": 4200 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.39304298162460327, - "train/contrastive_loss": 2.8759288787841797, - "train/negative_loss": 0.8945333361625671, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.9813954830169678, - "train/total_loss": 0.9682287573814392 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.13965536653995514, - "train/contrastive_loss": 1.6844475269317627, - "train/negative_loss": 1.0448664426803589, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.639581024646759, - "train/total_loss": 0.4765448570251465 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.17304709553718567, - "train/contrastive_loss": 0.903866171836853, - "train/negative_loss": 0.3067138195037842, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.5971523523330688, - "train/total_loss": 0.3538203239440918 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.2493240088224411, - "train/contrastive_loss": 2.4782824516296387, - "train/negative_loss": 1.111737608909607, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.3665447235107422, - "train/total_loss": 0.74498051404953 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.10098738968372345, - "train/contrastive_loss": 1.9218403100967407, - "train/negative_loss": 1.153903603553772, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.7679367065429688, - "train/total_loss": 0.4853554368019104 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.17858591675758362, - "train/contrastive_loss": 1.50437593460083, - "train/negative_loss": 1.2698147296905518, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.2345612347126007, - "train/total_loss": 0.47946110367774963 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.24548275768756866, - "train/contrastive_loss": 2.316471815109253, - "train/negative_loss": 1.5855680704116821, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.730903685092926, - "train/total_loss": 0.708777129650116 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.15483780205249786, - "train/contrastive_loss": 2.074988842010498, - "train/negative_loss": 1.2959930896759033, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.7789958119392395, - "train/total_loss": 0.5698356032371521 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.13324083387851715, - "train/contrastive_loss": 1.0362879037857056, - "train/negative_loss": 0.9728291630744934, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.06345871090888977, - "train/total_loss": 0.3404984176158905 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.28053784370422363, - "train/contrastive_loss": 3.2293813228607178, - "train/negative_loss": 1.5390743017196655, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.6903070211410522, - "train/total_loss": 0.9264141321182251 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.17056122422218323, - "train/contrastive_loss": 2.3028688430786133, - "train/negative_loss": 1.6609878540039062, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.641880989074707, - "train/total_loss": 0.6311349868774414 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.11556490510702133, - "train/contrastive_loss": 1.8315448760986328, - "train/negative_loss": 0.46392887830734253, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 1.367616057395935, - "train/total_loss": 0.48187389969825745 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.15666617453098297, - "train/contrastive_loss": 3.347996234893799, - "train/negative_loss": 1.7132210731506348, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.6347752809524536, - "train/total_loss": 0.8262653946876526 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.06881032884120941, - "train/contrastive_loss": 0.7923529148101807, - "train/negative_loss": 0.7923445105552673, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 8.374521712539718e-06, - "train/total_loss": 0.22728091478347778 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.09347039461135864, - "train/contrastive_loss": 1.337019443511963, - "train/negative_loss": 1.0091006755828857, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.3279188275337219, - "train/total_loss": 0.3608742952346802 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.14595384895801544, - "train/contrastive_loss": 1.5792487859725952, - "train/negative_loss": 0.6616594195365906, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.9175893664360046, - "train/total_loss": 0.4618036150932312 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.20979034900665283, - "train/contrastive_loss": 2.3456859588623047, - "train/negative_loss": 1.3005441427230835, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.0451416969299316, - "train/total_loss": 0.6789275407791138 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.1908547431230545, - "train/contrastive_loss": 1.2160483598709106, - "train/negative_loss": 0.4783741235733032, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.7376742362976074, - "train/total_loss": 0.43406441807746887 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.18466845154762268, - "train/contrastive_loss": 2.23915433883667, - "train/negative_loss": 1.0577951669692993, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 1.1813591718673706, - "train/total_loss": 0.6324993371963501 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.1220412403345108, - "train/contrastive_loss": 1.4693225622177124, - "train/negative_loss": 0.20591166615486145, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.2634109258651733, - "train/total_loss": 0.41590577363967896 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.17632335424423218, - "train/contrastive_loss": 1.2353554964065552, - "train/negative_loss": 0.25415435433387756, - "train/num_negatives": 44, - "train/num_positives": 10, - "train/positive_loss": 0.9812011122703552, - "train/total_loss": 0.42339444160461426 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.2538376450538635, - "train/contrastive_loss": 1.5405552387237549, - "train/negative_loss": 0.8102543950080872, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 0.730300784111023, - "train/total_loss": 0.5619486570358276 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.1182360127568245, - "train/contrastive_loss": 1.239654779434204, - "train/negative_loss": 0.29731637239456177, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.9423384666442871, - "train/total_loss": 0.36616697907447815 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.15356388688087463, - "train/contrastive_loss": 1.1521828174591064, - "train/negative_loss": 0.17328016459941864, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.9789026379585266, - "train/total_loss": 0.3840004503726959 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.08620686829090118, - "train/contrastive_loss": 1.7430689334869385, - "train/negative_loss": 0.6376668810844421, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 1.1054021120071411, - "train/total_loss": 0.43482065200805664 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.2999720871448517, - "train/contrastive_loss": 2.011557102203369, - "train/negative_loss": 0.7517892718315125, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.259767770767212, - "train/total_loss": 0.702283501625061 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.26612719893455505, - "train/contrastive_loss": 2.7970950603485107, - "train/negative_loss": 1.570884108543396, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.2262109518051147, - "train/total_loss": 0.8255462646484375 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.2066144198179245, - "train/contrastive_loss": 4.158864974975586, - "train/negative_loss": 3.0721120834350586, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 1.0867527723312378, - "train/total_loss": 1.038387417793274 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.22993718087673187, - "train/contrastive_loss": 1.997867465019226, - "train/negative_loss": 0.754845142364502, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 1.2430223226547241, - "train/total_loss": 0.6295107007026672 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.22107331454753876, - "train/contrastive_loss": 0.9667313098907471, - "train/negative_loss": 0.7394149303436279, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.22731640934944153, - "train/total_loss": 0.41441959142684937 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.09840701520442963, - "train/contrastive_loss": 1.1778833866119385, - "train/negative_loss": 0.6438666582107544, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.5340166687965393, - "train/total_loss": 0.3339836895465851 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.19604399800300598, - "train/contrastive_loss": 2.779995918273926, - "train/negative_loss": 1.3819321393966675, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.3980638980865479, - "train/total_loss": 0.7520432472229004 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.2549751102924347, - "train/contrastive_loss": 1.043469786643982, - "train/negative_loss": 1.0433307886123657, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.00013900769408792257, - "train/total_loss": 0.4636690616607666 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.16063085198402405, - "train/contrastive_loss": 0.6260595321655273, - "train/negative_loss": 0.5757052302360535, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.050354279577732086, - "train/total_loss": 0.28584277629852295 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.18915767967700958, - "train/contrastive_loss": 3.1302027702331543, - "train/negative_loss": 2.384493589401245, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.7457091808319092, - "train/total_loss": 0.8151982426643372 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.17359033226966858, - "train/contrastive_loss": 2.697814464569092, - "train/negative_loss": 1.1504735946655273, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.5473408699035645, - "train/total_loss": 0.7131532430648804 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.11559001356363297, - "train/contrastive_loss": 0.9747823476791382, - "train/negative_loss": 0.49559760093688965, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.47918471693992615, - "train/total_loss": 0.31054648756980896 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.1308848261833191, - "train/contrastive_loss": 1.1848864555358887, - "train/negative_loss": 1.1842565536499023, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.000629921443760395, - "train/total_loss": 0.36786210536956787 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.18416613340377808, - "train/contrastive_loss": 1.9673517942428589, - "train/negative_loss": 1.609407901763916, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.35794389247894287, - "train/total_loss": 0.5776364803314209 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.16737736761569977, - "train/contrastive_loss": 2.345773935317993, - "train/negative_loss": 2.3166861534118652, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.029087860137224197, - "train/total_loss": 0.636532187461853 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.20127594470977783, - "train/contrastive_loss": 2.2918944358825684, - "train/negative_loss": 1.4114402532577515, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.8804543018341064, - "train/total_loss": 0.6596548557281494 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.1790463924407959, - "train/contrastive_loss": 2.5263569355010986, - "train/negative_loss": 2.017500877380371, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.5088559985160828, - "train/total_loss": 0.6843177676200867 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.20979300141334534, - "train/contrastive_loss": 1.534686803817749, - "train/negative_loss": 0.32220298051834106, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 1.2124838829040527, - "train/total_loss": 0.5167303681373596 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.14904052019119263, - "train/contrastive_loss": 2.2664103507995605, - "train/negative_loss": 0.9704191088676453, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.29599130153656, - "train/total_loss": 0.6023225784301758 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.10684115439653397, - "train/contrastive_loss": 1.3275146484375, - "train/negative_loss": 0.6002274751663208, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.727287232875824, - "train/total_loss": 0.37234407663345337 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.2500471770763397, - "train/contrastive_loss": 0.7612115740776062, - "train/negative_loss": 0.7061457633972168, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.05506581813097, - "train/total_loss": 0.4022895097732544 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.09715240448713303, - "train/contrastive_loss": 0.835587739944458, - "train/negative_loss": 0.8355861902236938, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.5497223557758844e-06, - "train/total_loss": 0.26426994800567627 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.13551850616931915, - "train/contrastive_loss": 1.7327635288238525, - "train/negative_loss": 0.5851315855979919, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.1476320028305054, - "train/total_loss": 0.4820712208747864 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.09357018023729324, - "train/contrastive_loss": 1.1101911067962646, - "train/negative_loss": 1.044621229171753, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.06556981801986694, - "train/total_loss": 0.315608412027359 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.16342556476593018, - "train/contrastive_loss": 1.1024041175842285, - "train/negative_loss": 0.5642703175544739, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.5381337404251099, - "train/total_loss": 0.38390639424324036 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.12370584905147552, - "train/contrastive_loss": 1.4313215017318726, - "train/negative_loss": 0.36986830830574036, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.0614532232284546, - "train/total_loss": 0.40997016429901123 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.16616418957710266, - "train/contrastive_loss": 0.5203867554664612, - "train/negative_loss": 0.3874633014202118, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.1329234540462494, - "train/total_loss": 0.27024155855178833 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.18788881599903107, - "train/contrastive_loss": 2.657607078552246, - "train/negative_loss": 1.0179007053375244, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.6397064924240112, - "train/total_loss": 0.719410240650177 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.20854291319847107, - "train/contrastive_loss": 2.9282314777374268, - "train/negative_loss": 1.6582093238830566, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.2700221538543701, - "train/total_loss": 0.7941892147064209 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.1522425264120102, - "train/contrastive_loss": 1.3664723634719849, - "train/negative_loss": 0.32655569911003113, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 1.0399166345596313, - "train/total_loss": 0.42553699016571045 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.16552941501140594, - "train/contrastive_loss": 2.695533514022827, - "train/negative_loss": 1.68670654296875, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.0088269710540771, - "train/total_loss": 0.7046361565589905 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.29617249965667725, - "train/contrastive_loss": 4.201747894287109, - "train/negative_loss": 1.4838809967041016, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 2.717866897583008, - "train/total_loss": 1.1365220546722412 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.24952805042266846, - "train/contrastive_loss": 3.6728296279907227, - "train/negative_loss": 1.50849187374115, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 2.1643378734588623, - "train/total_loss": 0.984093964099884 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.18536224961280823, - "train/contrastive_loss": 2.1500191688537598, - "train/negative_loss": 0.9314612150192261, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.2185578346252441, - "train/total_loss": 0.6153661012649536 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.2325040102005005, - "train/contrastive_loss": 4.040821552276611, - "train/negative_loss": 1.6984604597091675, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 2.3423612117767334, - "train/total_loss": 1.040668249130249 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.2888477146625519, - "train/contrastive_loss": 4.097243309020996, - "train/negative_loss": 3.0284605026245117, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.0687830448150635, - "train/total_loss": 1.1082963943481445 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.29759693145751953, - "train/contrastive_loss": 2.8279409408569336, - "train/negative_loss": 1.5795049667358398, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.2484358549118042, - "train/total_loss": 0.8631851077079773 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.11922968178987503, - "train/contrastive_loss": 0.372842013835907, - "train/negative_loss": 0.37284040451049805, - "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 1.609327000551275e-06, - "train/total_loss": 0.19379809498786926 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.14058470726013184, - "train/contrastive_loss": 1.034597396850586, - "train/negative_loss": 0.27334681153297424, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.7612506151199341, - "train/total_loss": 0.347504198551178 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.10824552923440933, - "train/contrastive_loss": 1.2239439487457275, - "train/negative_loss": 0.3979693651199341, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.8259745836257935, - "train/total_loss": 0.3530343174934387 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.16867844760417938, - "train/contrastive_loss": 1.716456413269043, - "train/negative_loss": 1.716456413269043, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5119697451591492 - }, - { - "epoch": 15.96958174904943, - "eval_exact_match_accuracy": 0.3466666666666667, - "eval_hamming_loss": 0.0630812324929972, - "eval_loss": 0.5670315027236938, - "eval_macro_f1": 0.4264987300485739, - "eval_macro_precision": 0.6071176984091701, - "eval_macro_recall": 0.34903373045144337, - "eval_micro_f1": 0.6103806228373703, - "eval_micro_precision": 0.7791519434628975, - "eval_micro_recall": 0.5017064846416383, - "eval_runtime": 2.632, - "eval_samples_per_second": 199.47, - "eval_steps_per_second": 25.076, - "step": 4200 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.07531245797872543, - "train/contrastive_loss": 0.2301454395055771, - "train/negative_loss": 0.22989977896213531, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.0002456568763591349, - "train/total_loss": 0.12134154140949249 - }, - { - "epoch": 15.96958174904943, - "step": 4200, - "train/classification_loss": 0.10033910721540451, - "train/contrastive_loss": 2.052386522293091, - "train/negative_loss": 0.7195701599121094, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.3328163623809814, - "train/total_loss": 0.5108163952827454 - }, - { - "epoch": 16.159695817490494, - "grad_norm": 5.838689804077148, - "learning_rate": 1.93689497716895e-05, - "loss": 0.408, - "step": 4250 - }, - { - "epoch": 16.159695817490494, - "step": 4250, - "train/classification_loss": 0.06217866763472557, - "train/contrastive_loss": 0.4370507299900055, - "train/negative_loss": 0.4347321689128876, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.0023185655009001493, - "train/total_loss": 0.14958880841732025 - }, - { - "epoch": 16.159695817490494, - "step": 4250, - "train/classification_loss": 0.0865689367055893, - "train/contrastive_loss": 1.032860517501831, - "train/negative_loss": 0.716185450553894, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.3166751265525818, - "train/total_loss": 0.29314103722572327 - }, - { - "epoch": 16.34980988593156, - "grad_norm": 14.20672607421875, - "learning_rate": 1.9361339421613398e-05, - "loss": 0.3713, - "step": 4300 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.3717307150363922, - "train/contrastive_loss": 2.85872220993042, - "train/negative_loss": 0.8161187767982483, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 2.0426034927368164, - "train/total_loss": 0.9434751272201538 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.14308595657348633, - "train/contrastive_loss": 1.8398113250732422, - "train/negative_loss": 1.3074291944503784, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.5323821902275085, - "train/total_loss": 0.5110481977462769 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.17299658060073853, - "train/contrastive_loss": 0.9243437647819519, - "train/negative_loss": 0.16181330382823944, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.7625304460525513, - "train/total_loss": 0.3578653335571289 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.23351773619651794, - "train/contrastive_loss": 3.4908549785614014, - "train/negative_loss": 2.297121286392212, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.1937336921691895, - "train/total_loss": 0.9316887855529785 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.08973296731710434, - "train/contrastive_loss": 1.5456323623657227, - "train/negative_loss": 1.284303069114685, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.2613292634487152, - "train/total_loss": 0.398859441280365 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.16266527771949768, - "train/contrastive_loss": 1.444595456123352, - "train/negative_loss": 1.0340975522994995, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.41049790382385254, - "train/total_loss": 0.4515843689441681 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.19917519390583038, - "train/contrastive_loss": 1.8662962913513184, - "train/negative_loss": 1.1528575420379639, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.7134387493133545, - "train/total_loss": 0.5724344849586487 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.12692062556743622, - "train/contrastive_loss": 1.2946845293045044, - "train/negative_loss": 1.190192461013794, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.10449205338954926, - "train/total_loss": 0.3858575224876404 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.13162477314472198, - "train/contrastive_loss": 1.2996766567230225, - "train/negative_loss": 1.2882577180862427, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.011418983340263367, - "train/total_loss": 0.3915601372718811 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.3313162326812744, - "train/contrastive_loss": 3.569892644882202, - "train/negative_loss": 1.9914090633392334, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.5784835815429688, - "train/total_loss": 1.0452947616577148 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.13842234015464783, - "train/contrastive_loss": 2.262816905975342, - "train/negative_loss": 1.5805188417434692, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.6822981834411621, - "train/total_loss": 0.5909857153892517 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.10833518207073212, - "train/contrastive_loss": 2.3078277111053467, - "train/negative_loss": 0.8441100120544434, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 1.4637176990509033, - "train/total_loss": 0.5699007511138916 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.16807521879673004, - "train/contrastive_loss": 2.603693962097168, - "train/negative_loss": 1.860730767250061, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.7429633140563965, - "train/total_loss": 0.6888139843940735 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.08429429680109024, - "train/contrastive_loss": 2.2183046340942383, - "train/negative_loss": 2.2176597118377686, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.0006450102082453668, - "train/total_loss": 0.5279552340507507 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.12561023235321045, - "train/contrastive_loss": 2.5785117149353027, - "train/negative_loss": 1.1179577112197876, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.4605540037155151, - "train/total_loss": 0.6413125991821289 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.11769285053014755, - "train/contrastive_loss": 0.5933560132980347, - "train/negative_loss": 0.5099464654922485, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.08340957760810852, - "train/total_loss": 0.23636405169963837 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.20973870158195496, - "train/contrastive_loss": 2.5346224308013916, - "train/negative_loss": 1.5436993837356567, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.9909230470657349, - "train/total_loss": 0.7166632413864136 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.17585046589374542, - "train/contrastive_loss": 0.8615729808807373, - "train/negative_loss": 0.21075817942619324, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.6508147716522217, - "train/total_loss": 0.3481650650501251 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.21735456585884094, - "train/contrastive_loss": 2.9852330684661865, - "train/negative_loss": 2.0244486331939697, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.9607844352722168, - "train/total_loss": 0.8144011497497559 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.14686666429042816, - "train/contrastive_loss": 1.664607048034668, - "train/negative_loss": 0.169022798538208, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.49558424949646, - "train/total_loss": 0.47978806495666504 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.22418054938316345, - "train/contrastive_loss": 2.0621633529663086, - "train/negative_loss": 0.3450438976287842, - "train/num_negatives": 44, - "train/num_positives": 10, - "train/positive_loss": 1.717119574546814, - "train/total_loss": 0.6366132497787476 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.26061224937438965, - "train/contrastive_loss": 2.2203102111816406, - "train/negative_loss": 1.203181266784668, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 1.0171289443969727, - "train/total_loss": 0.7046743035316467 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.08100303262472153, - "train/contrastive_loss": 0.34540504217147827, - "train/negative_loss": 0.1270991861820221, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.21830585598945618, - "train/total_loss": 0.15008404850959778 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.14263086020946503, - "train/contrastive_loss": 0.31399065256118774, - "train/negative_loss": 0.2551105320453644, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.058880120515823364, - "train/total_loss": 0.20542898774147034 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.08935287594795227, - "train/contrastive_loss": 1.6211637258529663, - "train/negative_loss": 0.4061061441898346, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 1.215057611465454, - "train/total_loss": 0.4135856330394745 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.26951414346694946, - "train/contrastive_loss": 1.709012508392334, - "train/negative_loss": 0.18156594038009644, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.5274466276168823, - "train/total_loss": 0.6113166809082031 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.3049640357494354, - "train/contrastive_loss": 3.3912620544433594, - "train/negative_loss": 1.6735590696334839, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.717702865600586, - "train/total_loss": 0.983216404914856 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.18628822267055511, - "train/contrastive_loss": 4.226194381713867, - "train/negative_loss": 3.136430025100708, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 1.0897645950317383, - "train/total_loss": 1.031527042388916 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.18270237743854523, - "train/contrastive_loss": 1.5399267673492432, - "train/negative_loss": 0.5638517141342163, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.9760749936103821, - "train/total_loss": 0.4906877279281616 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.20316950976848602, - "train/contrastive_loss": 0.6118715405464172, - "train/negative_loss": 0.48567506670951843, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.1261964738368988, - "train/total_loss": 0.3255438208580017 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.10195034742355347, - "train/contrastive_loss": 1.2784733772277832, - "train/negative_loss": 0.6907278299331665, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.5877455472946167, - "train/total_loss": 0.35764503479003906 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.19827954471111298, - "train/contrastive_loss": 2.954085350036621, - "train/negative_loss": 1.3595457077026367, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.5945396423339844, - "train/total_loss": 0.7890966534614563 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.19455614686012268, - "train/contrastive_loss": 0.5734928846359253, - "train/negative_loss": 0.5732309818267822, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.00026187748881056905, - "train/total_loss": 0.3092547357082367 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.18884533643722534, - "train/contrastive_loss": 2.1669509410858154, - "train/negative_loss": 1.2047160863876343, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.9622348546981812, - "train/total_loss": 0.6222355365753174 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.21836435794830322, - "train/contrastive_loss": 4.688049793243408, - "train/negative_loss": 3.1949827671051025, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.4930669069290161, - "train/total_loss": 1.1559743881225586 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.17183785140514374, - "train/contrastive_loss": 3.0726547241210938, - "train/negative_loss": 1.3245550394058228, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.7480995655059814, - "train/total_loss": 0.7863688468933105 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.10691876709461212, - "train/contrastive_loss": 0.5974500775337219, - "train/negative_loss": 0.36591362953186035, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.23153643310070038, - "train/total_loss": 0.22640877962112427 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.17395173013210297, - "train/contrastive_loss": 0.9707255959510803, - "train/negative_loss": 0.9467006921768188, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.024024924263358116, - "train/total_loss": 0.36809685826301575 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.18032482266426086, - "train/contrastive_loss": 1.8292758464813232, - "train/negative_loss": 1.8092120885849, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.020063795149326324, - "train/total_loss": 0.546180009841919 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.17769712209701538, - "train/contrastive_loss": 2.1045069694519043, - "train/negative_loss": 2.0761091709136963, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.0283976923674345, - "train/total_loss": 0.5985984802246094 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.21098850667476654, - "train/contrastive_loss": 2.4231457710266113, - "train/negative_loss": 1.5511841773986816, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.8719615340232849, - "train/total_loss": 0.69561767578125 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.18215732276439667, - "train/contrastive_loss": 2.4064650535583496, - "train/negative_loss": 1.7427747249603271, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.6636902093887329, - "train/total_loss": 0.6634503602981567 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.18589390814304352, - "train/contrastive_loss": 1.5261871814727783, - "train/negative_loss": 0.41152599453926086, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 1.1146612167358398, - "train/total_loss": 0.49113136529922485 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.1792551726102829, - "train/contrastive_loss": 3.022465229034424, - "train/negative_loss": 1.3104240894317627, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.7120411396026611, - "train/total_loss": 0.7837482690811157 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.12042786180973053, - "train/contrastive_loss": 1.1742925643920898, - "train/negative_loss": 0.47541627287864685, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.6988762617111206, - "train/total_loss": 0.3552863597869873 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.2984105944633484, - "train/contrastive_loss": 0.9117871522903442, - "train/negative_loss": 0.5520508289337158, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.3597363233566284, - "train/total_loss": 0.48076802492141724 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.10284770280122757, - "train/contrastive_loss": 0.779131293296814, - "train/negative_loss": 0.779130220413208, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.0430818520035245e-06, - "train/total_loss": 0.2586739659309387 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.11666480451822281, - "train/contrastive_loss": 0.9150683283805847, - "train/negative_loss": 0.15241378545761108, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.7626545429229736, - "train/total_loss": 0.2996784746646881 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.12235077470541, - "train/contrastive_loss": 2.279966354370117, - "train/negative_loss": 1.5868895053863525, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.6930767893791199, - "train/total_loss": 0.5783440470695496 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.15643535554409027, - "train/contrastive_loss": 0.6157607436180115, - "train/negative_loss": 0.6077399253845215, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.008020828478038311, - "train/total_loss": 0.2795875072479248 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.14361275732517242, - "train/contrastive_loss": 1.7793076038360596, - "train/negative_loss": 0.35590827465057373, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.4233993291854858, - "train/total_loss": 0.49947428703308105 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.16574977338314056, - "train/contrastive_loss": 0.36629214882850647, - "train/negative_loss": 0.3655816614627838, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.0007104964461177588, - "train/total_loss": 0.23900820314884186 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.16746728122234344, - "train/contrastive_loss": 0.85031658411026, - "train/negative_loss": 0.4808352291584015, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.3694813549518585, - "train/total_loss": 0.33753061294555664 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.21009887754917145, - "train/contrastive_loss": 3.135467290878296, - "train/negative_loss": 2.42741060256958, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.708056628704071, - "train/total_loss": 0.8371923565864563 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.10402745753526688, - "train/contrastive_loss": 0.34878334403038025, - "train/negative_loss": 0.21874482929706573, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.13003851473331451, - "train/total_loss": 0.17378413677215576 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.17885833978652954, - "train/contrastive_loss": 2.976893424987793, - "train/negative_loss": 2.0685696601867676, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.9083238840103149, - "train/total_loss": 0.7742370367050171 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.28274279832839966, - "train/contrastive_loss": 2.94087553024292, - "train/negative_loss": 1.401755928993225, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.5391196012496948, - "train/total_loss": 0.8709179162979126 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.23684470355510712, - "train/contrastive_loss": 2.908329963684082, - "train/negative_loss": 1.6028670072555542, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.3054630756378174, - "train/total_loss": 0.8185107111930847 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.16822074353694916, - "train/contrastive_loss": 3.0217223167419434, - "train/negative_loss": 2.3296937942504883, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.6920285820960999, - "train/total_loss": 0.7725652456283569 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.2695653736591339, - "train/contrastive_loss": 3.840007781982422, - "train/negative_loss": 1.687527060508728, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 2.1524808406829834, - "train/total_loss": 1.037566900253296 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.3013212978839874, - "train/contrastive_loss": 5.875392436981201, - "train/negative_loss": 4.686075687408447, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.1893168687820435, - "train/total_loss": 1.4763997793197632 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.32676708698272705, - "train/contrastive_loss": 3.4834933280944824, - "train/negative_loss": 1.7541736364364624, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.7293198108673096, - "train/total_loss": 1.0234657526016235 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.1370600312948227, - "train/contrastive_loss": 0.42678070068359375, - "train/negative_loss": 0.42673182487487793, - "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 4.88781624881085e-05, - "train/total_loss": 0.22241616249084473 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.15153411030769348, - "train/contrastive_loss": 1.0579906702041626, - "train/negative_loss": 0.23839439451694489, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.8195962905883789, - "train/total_loss": 0.3631322383880615 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.08908506482839584, - "train/contrastive_loss": 1.0389995574951172, - "train/negative_loss": 0.3320072591304779, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.7069923281669617, - "train/total_loss": 0.2968849837779999 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.18538373708724976, - "train/contrastive_loss": 1.6266587972640991, - "train/negative_loss": 1.6266587972640991, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5107154846191406 - }, - { - "epoch": 16.34980988593156, - "eval_exact_match_accuracy": 0.33904761904761904, - "eval_hamming_loss": 0.06375350140056023, - "eval_loss": 0.576992392539978, - "eval_macro_f1": 0.42983393055197927, - "eval_macro_precision": 0.5605311223042906, - "eval_macro_recall": 0.3637469443978699, - "eval_micro_f1": 0.6178643384822028, - "eval_micro_precision": 0.7540983606557377, - "eval_micro_recall": 0.5233219567690558, - "eval_runtime": 2.613, - "eval_samples_per_second": 200.919, - "eval_steps_per_second": 25.258, - "step": 4300 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.11425904184579849, - "train/contrastive_loss": 0.7012526392936707, - "train/negative_loss": 0.13769622147083282, - "train/num_negatives": 36, - "train/num_positives": 12, - "train/positive_loss": 0.563556432723999, - "train/total_loss": 0.2545095682144165 - }, - { - "epoch": 16.34980988593156, - "step": 4300, - "train/classification_loss": 0.05886480584740639, - "train/contrastive_loss": 0.02984859049320221, - "train/negative_loss": 0.027219951152801514, - "train/num_negatives": 20, - "train/num_positives": 36, - "train/positive_loss": 0.002628638641908765, - "train/total_loss": 0.06483452022075653 - }, - { - "epoch": 16.539923954372625, - "grad_norm": 6.059859752655029, - "learning_rate": 1.9353729071537292e-05, - "loss": 0.394, - "step": 4350 - }, - { - "epoch": 16.539923954372625, - "step": 4350, - "train/classification_loss": 0.08014367520809174, - "train/contrastive_loss": 0.18099156022071838, - "train/negative_loss": 0.18006038665771484, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.0009311758331023157, - "train/total_loss": 0.11634199321269989 - }, - { - "epoch": 16.539923954372625, - "step": 4350, - "train/classification_loss": 0.12197644263505936, - "train/contrastive_loss": 0.8297626376152039, - "train/negative_loss": 0.5818992257118225, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.24786341190338135, - "train/total_loss": 0.287928968667984 - }, - { - "epoch": 16.730038022813687, - "grad_norm": 5.134601593017578, - "learning_rate": 1.934611872146119e-05, - "loss": 0.3835, - "step": 4400 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.3877705931663513, - "train/contrastive_loss": 3.203092336654663, - "train/negative_loss": 1.0770843029022217, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 2.1260080337524414, - "train/total_loss": 1.0283890962600708 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.13576814532279968, - "train/contrastive_loss": 1.4885245561599731, - "train/negative_loss": 0.943485677242279, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.5450388789176941, - "train/total_loss": 0.43347305059432983 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.17818395793437958, - "train/contrastive_loss": 0.934249222278595, - "train/negative_loss": 0.227386474609375, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.70686274766922, - "train/total_loss": 0.3650338053703308 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.23663416504859924, - "train/contrastive_loss": 3.449477195739746, - "train/negative_loss": 2.153383731842041, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.2960933446884155, - "train/total_loss": 0.9265296459197998 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.08220423012971878, - "train/contrastive_loss": 1.4964970350265503, - "train/negative_loss": 0.8402064442634583, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.656290590763092, - "train/total_loss": 0.3815036416053772 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.22283177077770233, - "train/contrastive_loss": 2.617959499359131, - "train/negative_loss": 1.6892750263214111, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.9286844730377197, - "train/total_loss": 0.7464237213134766 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.23868970572948456, - "train/contrastive_loss": 2.3450212478637695, - "train/negative_loss": 1.6007342338562012, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.7442868947982788, - "train/total_loss": 0.7076939344406128 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.1375311315059662, - "train/contrastive_loss": 1.4322725534439087, - "train/negative_loss": 0.9693885445594788, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.4628840386867523, - "train/total_loss": 0.42398566007614136 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.13918723165988922, - "train/contrastive_loss": 1.1706489324569702, - "train/negative_loss": 1.1278457641601562, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.04280312359333038, - "train/total_loss": 0.37331700325012207 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.3352401554584503, - "train/contrastive_loss": 2.9400837421417236, - "train/negative_loss": 1.3941231966018677, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.545960545539856, - "train/total_loss": 0.9232568740844727 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.16933783888816833, - "train/contrastive_loss": 2.4957046508789062, - "train/negative_loss": 1.6336815357208252, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.8620232343673706, - "train/total_loss": 0.668478786945343 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.10739888995885849, - "train/contrastive_loss": 1.502821445465088, - "train/negative_loss": 0.9019818305969238, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.6008395552635193, - "train/total_loss": 0.40796318650245667 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.1535145491361618, - "train/contrastive_loss": 1.3349573612213135, - "train/negative_loss": 1.2316416501998901, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.10331565886735916, - "train/total_loss": 0.42050600051879883 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.09319161623716354, - "train/contrastive_loss": 1.928959846496582, - "train/negative_loss": 1.9289281368255615, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 3.170523632434197e-05, - "train/total_loss": 0.478983610868454 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.10329818725585938, - "train/contrastive_loss": 2.1243977546691895, - "train/negative_loss": 0.8862850666046143, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.2381126880645752, - "train/total_loss": 0.5281777381896973 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.1692139059305191, - "train/contrastive_loss": 1.3668396472930908, - "train/negative_loss": 0.7539342641830444, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.6129054427146912, - "train/total_loss": 0.44258183240890503 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.2459591180086136, - "train/contrastive_loss": 2.0023193359375, - "train/negative_loss": 1.200731873512268, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.8015874028205872, - "train/total_loss": 0.6464229822158813 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.155077263712883, - "train/contrastive_loss": 1.335233449935913, - "train/negative_loss": 0.6283228397369385, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.7069106101989746, - "train/total_loss": 0.4221239686012268 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.22265933454036713, - "train/contrastive_loss": 1.4416980743408203, - "train/negative_loss": 1.1589338779449463, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.2827642560005188, - "train/total_loss": 0.5109989643096924 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.16798700392246246, - "train/contrastive_loss": 2.852206230163574, - "train/negative_loss": 1.9367897510528564, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.9154165387153625, - "train/total_loss": 0.7384282350540161 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.20652085542678833, - "train/contrastive_loss": 2.201566219329834, - "train/negative_loss": 0.42794185876846313, - "train/num_negatives": 44, - "train/num_positives": 10, - "train/positive_loss": 1.773624300956726, - "train/total_loss": 0.646834135055542 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.24263957142829895, - "train/contrastive_loss": 1.8541011810302734, - "train/negative_loss": 1.0574225187301636, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 0.7966786623001099, - "train/total_loss": 0.6134598255157471 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.09300613403320312, - "train/contrastive_loss": 0.5404849052429199, - "train/negative_loss": 0.17153897881507874, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.3689459562301636, - "train/total_loss": 0.2011031210422516 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.1426292061805725, - "train/contrastive_loss": 0.9144389629364014, - "train/negative_loss": 0.10225415229797363, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.8121848106384277, - "train/total_loss": 0.3255169987678528 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.06576687842607498, - "train/contrastive_loss": 0.9425181746482849, - "train/negative_loss": 0.18862955272197723, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.7538886070251465, - "train/total_loss": 0.2542705237865448 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.3055146634578705, - "train/contrastive_loss": 1.7592209577560425, - "train/negative_loss": 0.28340235352516174, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.4758186340332031, - "train/total_loss": 0.6573588848114014 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.3410005569458008, - "train/contrastive_loss": 3.52528715133667, - "train/negative_loss": 1.7497261762619019, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.7755608558654785, - "train/total_loss": 1.046057939529419 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.19003035128116608, - "train/contrastive_loss": 4.310844898223877, - "train/negative_loss": 3.2553701400756836, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 1.0554746389389038, - "train/total_loss": 1.052199363708496 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.1724582314491272, - "train/contrastive_loss": 1.5460114479064941, - "train/negative_loss": 0.6261506676673889, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.9198607802391052, - "train/total_loss": 0.48166051506996155 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.2050107717514038, - "train/contrastive_loss": 0.8536479473114014, - "train/negative_loss": 0.5414202809333801, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.31222769618034363, - "train/total_loss": 0.3757403492927551 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.09848406165838242, - "train/contrastive_loss": 2.5654804706573486, - "train/negative_loss": 2.03735089302063, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.528129518032074, - "train/total_loss": 0.6115801334381104 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.1924998015165329, - "train/contrastive_loss": 2.6150295734405518, - "train/negative_loss": 1.2216559648513794, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.3933736085891724, - "train/total_loss": 0.7155057191848755 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.2028246521949768, - "train/contrastive_loss": 0.4407005310058594, - "train/negative_loss": 0.4338494539260864, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.006851067300885916, - "train/total_loss": 0.2909647524356842 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.15781068801879883, - "train/contrastive_loss": 0.4796915650367737, - "train/negative_loss": 0.47516101598739624, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.004530562087893486, - "train/total_loss": 0.2537490129470825 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.20686247944831848, - "train/contrastive_loss": 3.213501453399658, - "train/negative_loss": 2.525153398513794, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.6883479356765747, - "train/total_loss": 0.8495627641677856 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.1926853358745575, - "train/contrastive_loss": 3.124483346939087, - "train/negative_loss": 1.2496953010559082, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.8747880458831787, - "train/total_loss": 0.8175820112228394 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.09919288754463196, - "train/contrastive_loss": 0.5283417701721191, - "train/negative_loss": 0.24581420421600342, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.28252753615379333, - "train/total_loss": 0.20486125349998474 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.1569875180721283, - "train/contrastive_loss": 0.9571613073348999, - "train/negative_loss": 0.9558516144752502, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.0013097156770527363, - "train/total_loss": 0.34841978549957275 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.1950511783361435, - "train/contrastive_loss": 1.8912838697433472, - "train/negative_loss": 1.8473824262619019, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.04390140622854233, - "train/total_loss": 0.5733079314231873 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.21422211825847626, - "train/contrastive_loss": 3.255129337310791, - "train/negative_loss": 3.2414743900299072, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.013654888607561588, - "train/total_loss": 0.8652480244636536 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.18327274918556213, - "train/contrastive_loss": 2.1786603927612305, - "train/negative_loss": 1.360323429107666, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.818337082862854, - "train/total_loss": 0.6190048456192017 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.1719771772623062, - "train/contrastive_loss": 2.6529479026794434, - "train/negative_loss": 2.240316390991211, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.4126315116882324, - "train/total_loss": 0.7025667428970337 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.19194278120994568, - "train/contrastive_loss": 1.874756097793579, - "train/negative_loss": 0.35011738538742065, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 1.5246386528015137, - "train/total_loss": 0.566893994808197 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.16225963830947876, - "train/contrastive_loss": 1.5792362689971924, - "train/negative_loss": 0.7340946197509766, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.8451417088508606, - "train/total_loss": 0.47810688614845276 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.10167115181684494, - "train/contrastive_loss": 1.3626725673675537, - "train/negative_loss": 0.8109309077262878, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.5517416000366211, - "train/total_loss": 0.37420567870140076 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.2867547273635864, - "train/contrastive_loss": 0.7038535475730896, - "train/negative_loss": 0.4295876920223236, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.274265855550766, - "train/total_loss": 0.42752546072006226 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.12241733819246292, - "train/contrastive_loss": 1.2267582416534424, - "train/negative_loss": 1.2267558574676514, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 2.384189883741783e-06, - "train/total_loss": 0.3677690029144287 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.13760529458522797, - "train/contrastive_loss": 1.4033689498901367, - "train/negative_loss": 0.300590455532074, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.102778434753418, - "train/total_loss": 0.41827911138534546 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.07041282951831818, - "train/contrastive_loss": 0.6130139231681824, - "train/negative_loss": 0.611697793006897, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.0013161383103579283, - "train/total_loss": 0.19301560521125793 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.14778435230255127, - "train/contrastive_loss": 0.4621056914329529, - "train/negative_loss": 0.358675092458725, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.10343058407306671, - "train/total_loss": 0.24020549654960632 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.134255513548851, - "train/contrastive_loss": 2.004323720932007, - "train/negative_loss": 0.5757400393486023, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.4285837411880493, - "train/total_loss": 0.5351202487945557 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.17631572484970093, - "train/contrastive_loss": 0.733598530292511, - "train/negative_loss": 0.36049792170524597, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.373100608587265, - "train/total_loss": 0.32303541898727417 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.14672636985778809, - "train/contrastive_loss": 1.515365719795227, - "train/negative_loss": 0.9518352746963501, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.563530445098877, - "train/total_loss": 0.449799507856369 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.2480601668357849, - "train/contrastive_loss": 4.21079158782959, - "train/negative_loss": 2.9143424034118652, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.296449065208435, - "train/total_loss": 1.0902185440063477 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.15060003101825714, - "train/contrastive_loss": 0.7987398505210876, - "train/negative_loss": 0.2405894249677658, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.5581504106521606, - "train/total_loss": 0.3103480041027069 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.17762288451194763, - "train/contrastive_loss": 2.8790130615234375, - "train/negative_loss": 1.9147504568099976, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.9642626047134399, - "train/total_loss": 0.7534254789352417 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.30021145939826965, - "train/contrastive_loss": 4.034943580627441, - "train/negative_loss": 1.6135274171829224, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 2.4214160442352295, - "train/total_loss": 1.1072001457214355 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.22287686169147491, - "train/contrastive_loss": 3.3506107330322266, - "train/negative_loss": 1.5944875478744507, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.7561230659484863, - "train/total_loss": 0.892998993396759 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.16655080020427704, - "train/contrastive_loss": 3.021552085876465, - "train/negative_loss": 2.0079805850982666, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.0135713815689087, - "train/total_loss": 0.7708612680435181 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.2712824046611786, - "train/contrastive_loss": 3.5945639610290527, - "train/negative_loss": 1.526096224784851, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 2.068467855453491, - "train/total_loss": 0.9901951551437378 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.277178555727005, - "train/contrastive_loss": 4.471060752868652, - "train/negative_loss": 3.415706157684326, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.0553544759750366, - "train/total_loss": 1.1713907718658447 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.30586105585098267, - "train/contrastive_loss": 3.2456021308898926, - "train/negative_loss": 1.6726555824279785, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.572946548461914, - "train/total_loss": 0.9549815058708191 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.12864471971988678, - "train/contrastive_loss": 0.4238523244857788, - "train/negative_loss": 0.4238291382789612, - "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 2.318672886758577e-05, - "train/total_loss": 0.21341517567634583 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.1698826402425766, - "train/contrastive_loss": 1.563974380493164, - "train/negative_loss": 0.8192265629768372, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.7447478175163269, - "train/total_loss": 0.48267751932144165 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.09117751568555832, - "train/contrastive_loss": 0.898037314414978, - "train/negative_loss": 0.2793367803096771, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.6187005639076233, - "train/total_loss": 0.27078497409820557 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.16629937291145325, - "train/contrastive_loss": 1.5377899408340454, - "train/negative_loss": 1.5377899408340454, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.4738573729991913 - }, - { - "epoch": 16.730038022813687, - "eval_exact_match_accuracy": 0.35428571428571426, - "eval_hamming_loss": 0.06330532212885154, - "eval_loss": 0.5753819942474365, - "eval_macro_f1": 0.4364261070610746, - "eval_macro_precision": 0.5642525355037066, - "eval_macro_recall": 0.3715877891331569, - "eval_micro_f1": 0.6255798542080848, - "eval_micro_precision": 0.7492063492063492, - "eval_micro_recall": 0.5369738339021616, - "eval_runtime": 2.6266, - "eval_samples_per_second": 199.875, - "eval_steps_per_second": 25.127, - "step": 4400 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.1704730987548828, - "train/contrastive_loss": 0.6433194279670715, - "train/negative_loss": 0.1492272913455963, - "train/num_negatives": 32, - "train/num_positives": 14, - "train/positive_loss": 0.4940921366214752, - "train/total_loss": 0.2991369962692261 - }, - { - "epoch": 16.730038022813687, - "step": 4400, - "train/classification_loss": 0.09958015382289886, - "train/contrastive_loss": 0.5088069438934326, - "train/negative_loss": 0.1752946376800537, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.3335123062133789, - "train/total_loss": 0.20134153962135315 - }, - { - "epoch": 16.920152091254753, - "grad_norm": 2.8697850704193115, - "learning_rate": 1.9338508371385085e-05, - "loss": 0.3825, - "step": 4450 - }, - { - "epoch": 16.920152091254753, - "step": 4450, - "train/classification_loss": 0.10762356966733932, - "train/contrastive_loss": 0.5198705792427063, - "train/negative_loss": 0.517063558101654, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.0028070290572941303, - "train/total_loss": 0.21159768104553223 - }, - { - "epoch": 16.920152091254753, - "step": 4450, - "train/classification_loss": 0.08878862857818604, - "train/contrastive_loss": 0.5676151514053345, - "train/negative_loss": 0.5017136335372925, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.0659015029668808, - "train/total_loss": 0.2023116648197174 - }, - { - "epoch": 17.11026615969582, - "grad_norm": 9.083450317382812, - "learning_rate": 1.933089802130898e-05, - "loss": 0.3723, - "step": 4500 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.3689402937889099, - "train/contrastive_loss": 2.5858466625213623, - "train/negative_loss": 0.8434430956840515, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.7424036264419556, - "train/total_loss": 0.8861096501350403 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.1400391012430191, - "train/contrastive_loss": 1.9353450536727905, - "train/negative_loss": 1.3760384321212769, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.5593066215515137, - "train/total_loss": 0.5271081328392029 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.18338851630687714, - "train/contrastive_loss": 1.4955286979675293, - "train/negative_loss": 0.46628686785697937, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.0292418003082275, - "train/total_loss": 0.4824942350387573 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.229106143116951, - "train/contrastive_loss": 3.308323383331299, - "train/negative_loss": 2.1232757568359375, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.1850476264953613, - "train/total_loss": 0.8907707929611206 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.09233406186103821, - "train/contrastive_loss": 1.7687108516693115, - "train/negative_loss": 1.2684876918792725, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.5002231001853943, - "train/total_loss": 0.44607624411582947 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.19551487267017365, - "train/contrastive_loss": 1.8828002214431763, - "train/negative_loss": 1.0371919870376587, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.8456082344055176, - "train/total_loss": 0.5720749497413635 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.23140306770801544, - "train/contrastive_loss": 3.006122350692749, - "train/negative_loss": 1.8584918975830078, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 1.1476304531097412, - "train/total_loss": 0.832627534866333 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.1209239810705185, - "train/contrastive_loss": 1.4806891679763794, - "train/negative_loss": 1.103934407234192, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.3767547309398651, - "train/total_loss": 0.41706180572509766 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.14016102254390717, - "train/contrastive_loss": 0.8744674324989319, - "train/negative_loss": 0.8681783080101013, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.00628912216052413, - "train/total_loss": 0.3150545060634613 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.3448367416858673, - "train/contrastive_loss": 2.7227253913879395, - "train/negative_loss": 1.2448450326919556, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.4778802394866943, - "train/total_loss": 0.8893818855285645 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.17748822271823883, - "train/contrastive_loss": 2.6607394218444824, - "train/negative_loss": 1.5447520017623901, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 1.1159873008728027, - "train/total_loss": 0.7096360921859741 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.11174210160970688, - "train/contrastive_loss": 0.8854286670684814, - "train/negative_loss": 0.28884565830230713, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.5965830087661743, - "train/total_loss": 0.2888278365135193 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.16870182752609253, - "train/contrastive_loss": 2.33526611328125, - "train/negative_loss": 1.6515558958053589, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.6837100982666016, - "train/total_loss": 0.6357550621032715 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.08696343004703522, - "train/contrastive_loss": 2.194040060043335, - "train/negative_loss": 2.193779468536377, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.0002606094058137387, - "train/total_loss": 0.52577143907547 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.11243107914924622, - "train/contrastive_loss": 2.4295849800109863, - "train/negative_loss": 1.0480668544769287, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.381518006324768, - "train/total_loss": 0.598348081111908 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.14247675240039825, - "train/contrastive_loss": 0.8975282907485962, - "train/negative_loss": 0.4324897527694702, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.465038537979126, - "train/total_loss": 0.32198241353034973 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.24202613532543182, - "train/contrastive_loss": 2.0672271251678467, - "train/negative_loss": 0.8501841425895691, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.2170429229736328, - "train/total_loss": 0.6554715633392334 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.1807321459054947, - "train/contrastive_loss": 1.8107895851135254, - "train/negative_loss": 1.0681005716323853, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.7426890134811401, - "train/total_loss": 0.5428900718688965 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.1903330534696579, - "train/contrastive_loss": 1.409553050994873, - "train/negative_loss": 0.8726785182952881, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.5368744730949402, - "train/total_loss": 0.47224366664886475 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.1250700056552887, - "train/contrastive_loss": 2.101668357849121, - "train/negative_loss": 0.8072668313980103, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.2944015264511108, - "train/total_loss": 0.5454037189483643 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.2182636857032776, - "train/contrastive_loss": 1.4891400337219238, - "train/negative_loss": 0.24169263243675232, - "train/num_negatives": 44, - "train/num_positives": 10, - "train/positive_loss": 1.2474473714828491, - "train/total_loss": 0.5160917043685913 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.22179704904556274, - "train/contrastive_loss": 2.043473482131958, - "train/negative_loss": 0.7152882218360901, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 1.3281853199005127, - "train/total_loss": 0.6304917335510254 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.10719186067581177, - "train/contrastive_loss": 1.327432632446289, - "train/negative_loss": 0.3817008435726166, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.9457318186759949, - "train/total_loss": 0.37267839908599854 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.15345582365989685, - "train/contrastive_loss": 0.47471463680267334, - "train/negative_loss": 0.19230592250823975, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.2824087142944336, - "train/total_loss": 0.24839875102043152 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.09227611124515533, - "train/contrastive_loss": 1.4265799522399902, - "train/negative_loss": 0.3429115116596222, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 1.0836684703826904, - "train/total_loss": 0.3775920867919922 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.3155495226383209, - "train/contrastive_loss": 1.805492639541626, - "train/negative_loss": 0.2205517590045929, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.5849409103393555, - "train/total_loss": 0.6766480207443237 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.2971342206001282, - "train/contrastive_loss": 3.601205825805664, - "train/negative_loss": 1.784561276435852, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.816644549369812, - "train/total_loss": 1.0173754692077637 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.17784050107002258, - "train/contrastive_loss": 3.813019275665283, - "train/negative_loss": 2.392852306365967, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 1.420167088508606, - "train/total_loss": 0.9404443502426147 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.19840097427368164, - "train/contrastive_loss": 1.7779202461242676, - "train/negative_loss": 0.57786625623703, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 1.2000540494918823, - "train/total_loss": 0.5539849996566772 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.21731741726398468, - "train/contrastive_loss": 1.8804306983947754, - "train/negative_loss": 1.564897060394287, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.31553366780281067, - "train/total_loss": 0.5934035778045654 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.10779757797718048, - "train/contrastive_loss": 2.311380386352539, - "train/negative_loss": 1.199515700340271, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 1.1118648052215576, - "train/total_loss": 0.570073664188385 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.18317000567913055, - "train/contrastive_loss": 2.847766876220703, - "train/negative_loss": 1.5373291969299316, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.3104376792907715, - "train/total_loss": 0.7527233958244324 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.2319207787513733, - "train/contrastive_loss": 0.7929688692092896, - "train/negative_loss": 0.7923679947853088, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0006008761120028794, - "train/total_loss": 0.3905145525932312 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.16661661863327026, - "train/contrastive_loss": 1.1734925508499146, - "train/negative_loss": 0.6028854250907898, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.5706071257591248, - "train/total_loss": 0.4013151526451111 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.20942452549934387, - "train/contrastive_loss": 3.123014211654663, - "train/negative_loss": 2.3798279762268066, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.7431862354278564, - "train/total_loss": 0.8340274095535278 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.20320247113704681, - "train/contrastive_loss": 3.1585381031036377, - "train/negative_loss": 1.2578110694885254, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.9007270336151123, - "train/total_loss": 0.8349100947380066 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.11460702866315842, - "train/contrastive_loss": 0.8014159202575684, - "train/negative_loss": 0.45161187648773193, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.3498040735721588, - "train/total_loss": 0.2748902142047882 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.16037146747112274, - "train/contrastive_loss": 2.3664658069610596, - "train/negative_loss": 0.9048004150390625, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 1.461665391921997, - "train/total_loss": 0.633664608001709 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.18912525475025177, - "train/contrastive_loss": 1.3087022304534912, - "train/negative_loss": 1.2953211069107056, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.013381104916334152, - "train/total_loss": 0.4508656859397888 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.20274309813976288, - "train/contrastive_loss": 1.9804050922393799, - "train/negative_loss": 1.9703515768051147, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.010053456760942936, - "train/total_loss": 0.598824143409729 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.1594841331243515, - "train/contrastive_loss": 1.3064197301864624, - "train/negative_loss": 1.1703318357467651, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.13608789443969727, - "train/total_loss": 0.4207680821418762 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.17631204426288605, - "train/contrastive_loss": 2.2744035720825195, - "train/negative_loss": 1.618899941444397, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.6555035710334778, - "train/total_loss": 0.6311927437782288 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.1857835352420807, - "train/contrastive_loss": 2.2959587574005127, - "train/negative_loss": 0.5405935645103455, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 1.755365252494812, - "train/total_loss": 0.6449753046035767 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.19750508666038513, - "train/contrastive_loss": 3.2884716987609863, - "train/negative_loss": 1.4540666341781616, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.8344051837921143, - "train/total_loss": 0.8551994562149048 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.10866712033748627, - "train/contrastive_loss": 0.8066895008087158, - "train/negative_loss": 0.3967432975769043, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.40994617342948914, - "train/total_loss": 0.2700050175189972 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.2550738751888275, - "train/contrastive_loss": 0.9642300605773926, - "train/negative_loss": 0.5414025187492371, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.4228275418281555, - "train/total_loss": 0.44791990518569946 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.1058429405093193, - "train/contrastive_loss": 0.3998004198074341, - "train/negative_loss": 0.3997820317745209, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.8388360331300646e-05, - "train/total_loss": 0.18580302596092224 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.14176255464553833, - "train/contrastive_loss": 1.6391658782958984, - "train/negative_loss": 0.7084370851516724, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.9307287335395813, - "train/total_loss": 0.469595730304718 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.08569186180830002, - "train/contrastive_loss": 0.9134218096733093, - "train/negative_loss": 0.9084799885749817, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.004941806197166443, - "train/total_loss": 0.2683762311935425 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.14886751770973206, - "train/contrastive_loss": 0.5080883502960205, - "train/negative_loss": 0.47425684332847595, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.03383148834109306, - "train/total_loss": 0.2504851818084717 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.14199198782444, - "train/contrastive_loss": 2.563875675201416, - "train/negative_loss": 0.7201023101806641, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.8437732458114624, - "train/total_loss": 0.6547670960426331 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.15723614394664764, - "train/contrastive_loss": 0.43171370029449463, - "train/negative_loss": 0.2408907413482666, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.19082295894622803, - "train/total_loss": 0.24357888102531433 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.20335781574249268, - "train/contrastive_loss": 1.8160574436187744, - "train/negative_loss": 1.1792476177215576, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.6368098258972168, - "train/total_loss": 0.5665693283081055 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.22111685574054718, - "train/contrastive_loss": 3.2291884422302246, - "train/negative_loss": 2.892106294631958, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.33708226680755615, - "train/total_loss": 0.8669545650482178 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.1551881581544876, - "train/contrastive_loss": 1.058903694152832, - "train/negative_loss": 0.46582847833633423, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.5930752754211426, - "train/total_loss": 0.36696889996528625 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.1725686937570572, - "train/contrastive_loss": 3.1538031101226807, - "train/negative_loss": 1.9081330299377441, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.2456700801849365, - "train/total_loss": 0.8033292889595032 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.31499147415161133, - "train/contrastive_loss": 4.271336078643799, - "train/negative_loss": 1.7353076934814453, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 2.5360283851623535, - "train/total_loss": 1.169258713722229 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.25374850630760193, - "train/contrastive_loss": 3.846853256225586, - "train/negative_loss": 1.8577216863632202, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.9891314506530762, - "train/total_loss": 1.0231192111968994 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.13990719616413116, - "train/contrastive_loss": 0.9235433340072632, - "train/negative_loss": 0.7943394780158997, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.1292038857936859, - "train/total_loss": 0.32461586594581604 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.24687407910823822, - "train/contrastive_loss": 3.4083938598632812, - "train/negative_loss": 1.549236536026001, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.8591572046279907, - "train/total_loss": 0.9285528659820557 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.27030450105667114, - "train/contrastive_loss": 5.633761882781982, - "train/negative_loss": 4.170772075653076, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.4629898071289062, - "train/total_loss": 1.3970568180084229 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.3105849027633667, - "train/contrastive_loss": 3.3342673778533936, - "train/negative_loss": 1.6889910697937012, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.6452763080596924, - "train/total_loss": 0.9774383902549744 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.11357920616865158, - "train/contrastive_loss": 0.3030424416065216, - "train/negative_loss": 0.30303606390953064, - "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 6.377733370754868e-06, - "train/total_loss": 0.17418769001960754 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.1693533957004547, - "train/contrastive_loss": 1.2684032917022705, - "train/negative_loss": 0.5423550009727478, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.7260482907295227, - "train/total_loss": 0.42303407192230225 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.11574644595384598, - "train/contrastive_loss": 1.52317214012146, - "train/negative_loss": 0.5109732151031494, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.0121989250183105, - "train/total_loss": 0.4203808605670929 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.17961038649082184, - "train/contrastive_loss": 1.5780645608901978, - "train/negative_loss": 1.5780645608901978, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.4952232837677002 - }, - { - "epoch": 17.11026615969582, - "eval_exact_match_accuracy": 0.3523809523809524, - "eval_hamming_loss": 0.0630812324929972, - "eval_loss": 0.5838881134986877, - "eval_macro_f1": 0.454954815355689, - "eval_macro_precision": 0.5978258454745724, - "eval_macro_recall": 0.396890331473434, - "eval_micro_f1": 0.6313032089063523, - "eval_micro_precision": 0.7438271604938271, - "eval_micro_recall": 0.5483503981797497, - "eval_runtime": 2.6306, - "eval_samples_per_second": 199.574, - "eval_steps_per_second": 25.089, - "step": 4500 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.0882859155535698, - "train/contrastive_loss": 0.2636205852031708, - "train/negative_loss": 0.26307740807533264, - "train/num_negatives": 36, - "train/num_positives": 10, - "train/positive_loss": 0.000543176953215152, - "train/total_loss": 0.14101003110408783 - }, - { - "epoch": 17.11026615969582, - "step": 4500, - "train/classification_loss": 0.08216880261898041, - "train/contrastive_loss": 0.12179805338382721, - "train/negative_loss": 0.1217912808060646, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 6.775090696464758e-06, - "train/total_loss": 0.10652841627597809 - }, - { - "epoch": 17.30038022813688, - "grad_norm": 8.554377555847168, - "learning_rate": 1.9323287671232878e-05, - "loss": 0.4024, - "step": 4550 - }, - { - "epoch": 17.30038022813688, - "step": 4550, - "train/classification_loss": 0.041233744472265244, - "train/contrastive_loss": 0.27006372809410095, - "train/negative_loss": 0.26257723569869995, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.0074864961206912994, - "train/total_loss": 0.09524649381637573 - }, - { - "epoch": 17.30038022813688, - "step": 4550, - "train/classification_loss": 0.05310553312301636, - "train/contrastive_loss": 0.16828250885009766, - "train/negative_loss": 0.16062286496162415, - "train/num_negatives": 32, - "train/num_positives": 20, - "train/positive_loss": 0.007659647148102522, - "train/total_loss": 0.08676204085350037 - }, - { - "epoch": 17.490494296577946, - "grad_norm": 8.103089332580566, - "learning_rate": 1.9315677321156773e-05, - "loss": 0.3565, - "step": 4600 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.36089780926704407, - "train/contrastive_loss": 3.2707395553588867, - "train/negative_loss": 0.7763468027114868, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 2.4943928718566895, - "train/total_loss": 1.0150457620620728 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.12697497010231018, - "train/contrastive_loss": 1.5984954833984375, - "train/negative_loss": 1.1001698970794678, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.49832552671432495, - "train/total_loss": 0.44667407870292664 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.19753940403461456, - "train/contrastive_loss": 0.9573248624801636, - "train/negative_loss": 0.18739470839500427, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.7699301838874817, - "train/total_loss": 0.3890043795108795 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.24273653328418732, - "train/contrastive_loss": 2.842918634414673, - "train/negative_loss": 1.4366389513015747, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.4062796831130981, - "train/total_loss": 0.8113202452659607 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.08935242891311646, - "train/contrastive_loss": 1.4627916812896729, - "train/negative_loss": 1.2288185358047485, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.23397308588027954, - "train/total_loss": 0.3819107711315155 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.20168666541576385, - "train/contrastive_loss": 3.124734878540039, - "train/negative_loss": 1.4110008478164673, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 1.7137341499328613, - "train/total_loss": 0.8266336917877197 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.21878083050251007, - "train/contrastive_loss": 3.176151752471924, - "train/negative_loss": 1.9299118518829346, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 1.2462399005889893, - "train/total_loss": 0.8540111780166626 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.12916721403598785, - "train/contrastive_loss": 2.1248793601989746, - "train/negative_loss": 1.1355063915252686, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.9893728494644165, - "train/total_loss": 0.5541430711746216 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.1485709249973297, - "train/contrastive_loss": 0.8652650117874146, - "train/negative_loss": 0.834801435470581, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.030463552102446556, - "train/total_loss": 0.32162392139434814 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.3333165943622589, - "train/contrastive_loss": 2.664935350418091, - "train/negative_loss": 1.4102535247802734, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.2546818256378174, - "train/total_loss": 0.8663036823272705 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.18664491176605225, - "train/contrastive_loss": 2.8398332595825195, - "train/negative_loss": 1.5626252889633179, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 1.2772080898284912, - "train/total_loss": 0.7546115517616272 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.11164135485887527, - "train/contrastive_loss": 1.571216344833374, - "train/negative_loss": 0.6169759631156921, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.9542403221130371, - "train/total_loss": 0.4258846342563629 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.18136605620384216, - "train/contrastive_loss": 3.690124273300171, - "train/negative_loss": 1.829322338104248, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.8608019351959229, - "train/total_loss": 0.9193909168243408 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.08700645714998245, - "train/contrastive_loss": 2.120159864425659, - "train/negative_loss": 2.120063304901123, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 9.666570258559659e-05, - "train/total_loss": 0.5110384225845337 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.11481256783008575, - "train/contrastive_loss": 2.5801963806152344, - "train/negative_loss": 0.7973760962486267, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.7828203439712524, - "train/total_loss": 0.6308518648147583 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.14045991003513336, - "train/contrastive_loss": 0.9381479620933533, - "train/negative_loss": 0.5404318571090698, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.39771610498428345, - "train/total_loss": 0.32808950543403625 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.26307547092437744, - "train/contrastive_loss": 1.8845291137695312, - "train/negative_loss": 0.7072657942771912, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.1772632598876953, - "train/total_loss": 0.6399812698364258 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.1990024298429489, - "train/contrastive_loss": 1.5993996858596802, - "train/negative_loss": 0.5764071941375732, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 1.022992491722107, - "train/total_loss": 0.5188823938369751 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.2085309624671936, - "train/contrastive_loss": 0.9132332801818848, - "train/negative_loss": 0.4921282231807709, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.4211050868034363, - "train/total_loss": 0.39117762446403503 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.14648926258087158, - "train/contrastive_loss": 1.6887047290802002, - "train/negative_loss": 0.5891973972320557, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.0995073318481445, - "train/total_loss": 0.4842302203178406 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.2057667374610901, - "train/contrastive_loss": 1.5011626482009888, - "train/negative_loss": 0.29666876792907715, - "train/num_negatives": 44, - "train/num_positives": 10, - "train/positive_loss": 1.2044938802719116, - "train/total_loss": 0.5059992671012878 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.24079379439353943, - "train/contrastive_loss": 1.760134220123291, - "train/negative_loss": 0.8332087993621826, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 0.9269254207611084, - "train/total_loss": 0.5928206443786621 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.10657858848571777, - "train/contrastive_loss": 1.069412112236023, - "train/negative_loss": 0.20628678798675537, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.8631253242492676, - "train/total_loss": 0.3204610347747803 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.1571383774280548, - "train/contrastive_loss": 1.015452265739441, - "train/negative_loss": 0.11613786965608597, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.8993144035339355, - "train/total_loss": 0.36022883653640747 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.06945175677537918, - "train/contrastive_loss": 0.6514001488685608, - "train/negative_loss": 0.15579567849636078, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.4956044554710388, - "train/total_loss": 0.19973179697990417 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.3120441436767578, - "train/contrastive_loss": 1.7650909423828125, - "train/negative_loss": 0.2034302055835724, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.5616607666015625, - "train/total_loss": 0.6650623083114624 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.30057406425476074, - "train/contrastive_loss": 2.573275566101074, - "train/negative_loss": 1.514098048210144, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.0591776371002197, - "train/total_loss": 0.8152291774749756 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.19660192728042603, - "train/contrastive_loss": 4.280754089355469, - "train/negative_loss": 3.0157015323638916, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 1.265052318572998, - "train/total_loss": 1.0527527332305908 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.1772814691066742, - "train/contrastive_loss": 1.6392171382904053, - "train/negative_loss": 0.7947980165481567, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.8444191217422485, - "train/total_loss": 0.5051249265670776 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.20886246860027313, - "train/contrastive_loss": 0.8602638244628906, - "train/negative_loss": 0.40623143315315247, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.45403239130973816, - "train/total_loss": 0.38091522455215454 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.09769244492053986, - "train/contrastive_loss": 1.8556865453720093, - "train/negative_loss": 0.7828247547149658, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 1.0728617906570435, - "train/total_loss": 0.4688297510147095 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.20590588450431824, - "train/contrastive_loss": 2.840975284576416, - "train/negative_loss": 1.2203906774520874, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.620584487915039, - "train/total_loss": 0.7741008996963501 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.2417968064546585, - "train/contrastive_loss": 0.6455224752426147, - "train/negative_loss": 0.6451660990715027, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.00035638007102534175, - "train/total_loss": 0.37090128660202026 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.1620139181613922, - "train/contrastive_loss": 0.585523247718811, - "train/negative_loss": 0.49531978368759155, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.09020344913005829, - "train/total_loss": 0.2791185677051544 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.22004972398281097, - "train/contrastive_loss": 3.0611023902893066, - "train/negative_loss": 2.4406628608703613, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.6204394102096558, - "train/total_loss": 0.8322702050209045 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.183002769947052, - "train/contrastive_loss": 3.1424875259399414, - "train/negative_loss": 1.1393483877182007, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 2.0031392574310303, - "train/total_loss": 0.8115003108978271 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.11358154565095901, - "train/contrastive_loss": 1.5040924549102783, - "train/negative_loss": 1.0897960662841797, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.41429635882377625, - "train/total_loss": 0.41440004110336304 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.16030636429786682, - "train/contrastive_loss": 1.0832188129425049, - "train/negative_loss": 0.7874190211296082, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.2957998514175415, - "train/total_loss": 0.37695014476776123 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.18111000955104828, - "train/contrastive_loss": 0.9511035680770874, - "train/negative_loss": 0.9505124688148499, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.0005910899490118027, - "train/total_loss": 0.37133073806762695 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.19436950981616974, - "train/contrastive_loss": 2.1629140377044678, - "train/negative_loss": 2.149782657623291, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.013131329789757729, - "train/total_loss": 0.6269523501396179 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.20367556810379028, - "train/contrastive_loss": 2.010071277618408, - "train/negative_loss": 1.1804280281066895, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.829643189907074, - "train/total_loss": 0.6056898236274719 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.19035367667675018, - "train/contrastive_loss": 2.2636961936950684, - "train/negative_loss": 1.585236668586731, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.6784594655036926, - "train/total_loss": 0.643092930316925 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.2138860672712326, - "train/contrastive_loss": 2.244418144226074, - "train/negative_loss": 0.6884671449661255, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 1.5559511184692383, - "train/total_loss": 0.6627696752548218 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.19661179184913635, - "train/contrastive_loss": 2.381340980529785, - "train/negative_loss": 1.235967993736267, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.145372986793518, - "train/total_loss": 0.6728799939155579 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.11122805625200272, - "train/contrastive_loss": 1.486335277557373, - "train/negative_loss": 0.737412691116333, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.74892258644104, - "train/total_loss": 0.40849509835243225 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.24814173579216003, - "train/contrastive_loss": 0.883456826210022, - "train/negative_loss": 0.6630691289901733, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.22038768231868744, - "train/total_loss": 0.42483311891555786 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.10568113625049591, - "train/contrastive_loss": 0.5925672054290771, - "train/negative_loss": 0.5918726921081543, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.0006945374188944697, - "train/total_loss": 0.22419458627700806 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.11776351928710938, - "train/contrastive_loss": 1.1348716020584106, - "train/negative_loss": 0.32110247015953064, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.8137691020965576, - "train/total_loss": 0.34473782777786255 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.08172590285539627, - "train/contrastive_loss": 0.8747919201850891, - "train/negative_loss": 0.8638182878494263, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.010973620228469372, - "train/total_loss": 0.2566843032836914 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.15076802670955658, - "train/contrastive_loss": 0.7215332984924316, - "train/negative_loss": 0.11892375349998474, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.6026095747947693, - "train/total_loss": 0.2950747013092041 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.12454832345247269, - "train/contrastive_loss": 1.6975034475326538, - "train/negative_loss": 0.3521241843700409, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.3453792333602905, - "train/total_loss": 0.46404901146888733 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.14368261396884918, - "train/contrastive_loss": 0.5205967426300049, - "train/negative_loss": 0.32626238465309143, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.19433435797691345, - "train/total_loss": 0.24780195951461792 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.1981779783964157, - "train/contrastive_loss": 1.02780282497406, - "train/negative_loss": 0.6181772351264954, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.4096255600452423, - "train/total_loss": 0.4037385582923889 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.22867166996002197, - "train/contrastive_loss": 3.177244186401367, - "train/negative_loss": 2.650054693222046, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.5271895527839661, - "train/total_loss": 0.8641205430030823 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.18615268170833588, - "train/contrastive_loss": 1.2411612272262573, - "train/negative_loss": 0.37011823058128357, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.8710430264472961, - "train/total_loss": 0.43438494205474854 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.17009221017360687, - "train/contrastive_loss": 2.9826345443725586, - "train/negative_loss": 1.791677713394165, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.1909568309783936, - "train/total_loss": 0.7666191458702087 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.30014991760253906, - "train/contrastive_loss": 3.904078960418701, - "train/negative_loss": 1.7056301832199097, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 2.198448896408081, - "train/total_loss": 1.0809657573699951 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.24679511785507202, - "train/contrastive_loss": 3.820739984512329, - "train/negative_loss": 2.114885091781616, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.705854892730713, - "train/total_loss": 1.0109431743621826 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.14452393352985382, - "train/contrastive_loss": 1.6334601640701294, - "train/negative_loss": 0.6270796060562134, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.006380558013916, - "train/total_loss": 0.47121596336364746 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.24911555647850037, - "train/contrastive_loss": 3.5518271923065186, - "train/negative_loss": 1.61606764793396, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.9357595443725586, - "train/total_loss": 0.9594810009002686 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.29985734820365906, - "train/contrastive_loss": 4.3486480712890625, - "train/negative_loss": 3.065412998199463, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.2832350730895996, - "train/total_loss": 1.1695870161056519 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.298429936170578, - "train/contrastive_loss": 2.8859546184539795, - "train/negative_loss": 1.444532036781311, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.4414225816726685, - "train/total_loss": 0.8756208419799805 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.1314956396818161, - "train/contrastive_loss": 0.5782631039619446, - "train/negative_loss": 0.5781813859939575, - "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 8.172458183253184e-05, - "train/total_loss": 0.24714826047420502 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.17731308937072754, - "train/contrastive_loss": 1.3056085109710693, - "train/negative_loss": 0.5409131050109863, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.7646954655647278, - "train/total_loss": 0.43843480944633484 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.108541339635849, - "train/contrastive_loss": 1.4958558082580566, - "train/negative_loss": 0.5673199892044067, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.9285358190536499, - "train/total_loss": 0.40771251916885376 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.16879431903362274, - "train/contrastive_loss": 1.6647754907608032, - "train/negative_loss": 1.6647754907608032, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5017493963241577 - }, - { - "epoch": 17.490494296577946, - "eval_exact_match_accuracy": 0.3504761904761905, - "eval_hamming_loss": 0.06352941176470588, - "eval_loss": 0.5712664723396301, - "eval_macro_f1": 0.45233784233004665, - "eval_macro_precision": 0.5964940603373698, - "eval_macro_recall": 0.38538342368426204, - "eval_micro_f1": 0.6217478318879253, - "eval_micro_precision": 0.7516129032258064, - "eval_micro_recall": 0.5301478953356087, - "eval_runtime": 2.6352, - "eval_samples_per_second": 199.229, - "eval_steps_per_second": 25.046, - "step": 4600 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.13913093507289886, - "train/contrastive_loss": 0.7668935060501099, - "train/negative_loss": 0.43982869386672974, - "train/num_negatives": 42, - "train/num_positives": 6, - "train/positive_loss": 0.3270648121833801, - "train/total_loss": 0.29250964522361755 - }, - { - "epoch": 17.490494296577946, - "step": 4600, - "train/classification_loss": 0.08646177500486374, - "train/contrastive_loss": 0.6336468458175659, - "train/negative_loss": 0.6225364208221436, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.011110448278486729, - "train/total_loss": 0.21319115161895752 - }, - { - "epoch": 17.680608365019012, - "grad_norm": 4.3980302810668945, - "learning_rate": 1.930806697108067e-05, - "loss": 0.3799, - "step": 4650 - }, - { - "epoch": 17.680608365019012, - "step": 4650, - "train/classification_loss": 0.08132649213075638, - "train/contrastive_loss": 0.48385924100875854, - "train/negative_loss": 0.4838034212589264, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 5.583195525105111e-05, - "train/total_loss": 0.17809835076332092 - }, - { - "epoch": 17.680608365019012, - "step": 4650, - "train/classification_loss": 0.09166789054870605, - "train/contrastive_loss": 0.45400741696357727, - "train/negative_loss": 0.19445374608039856, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.2595536708831787, - "train/total_loss": 0.18246936798095703 - }, - { - "epoch": 17.870722433460077, - "grad_norm": 2.9037811756134033, - "learning_rate": 1.930045662100457e-05, - "loss": 0.3917, - "step": 4700 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.3542347550392151, - "train/contrastive_loss": 2.5558972358703613, - "train/negative_loss": 0.3795410692691803, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 2.176356077194214, - "train/total_loss": 0.8654142022132874 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.13123458623886108, - "train/contrastive_loss": 1.639920949935913, - "train/negative_loss": 1.1459195613861084, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.49400144815444946, - "train/total_loss": 0.4592187702655792 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.18492592871189117, - "train/contrastive_loss": 1.0866577625274658, - "train/negative_loss": 0.4077554941177368, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.678902268409729, - "train/total_loss": 0.40225750207901 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.24905173480510712, - "train/contrastive_loss": 3.554521083831787, - "train/negative_loss": 2.3932790756225586, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.161241888999939, - "train/total_loss": 0.9599559903144836 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.0940665677189827, - "train/contrastive_loss": 1.1487681865692139, - "train/negative_loss": 0.7780058979988098, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.3707622289657593, - "train/total_loss": 0.32382020354270935 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.1881561577320099, - "train/contrastive_loss": 1.7612375020980835, - "train/negative_loss": 1.1784836053848267, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.5827538967132568, - "train/total_loss": 0.5404036641120911 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.20507021248340607, - "train/contrastive_loss": 2.2535367012023926, - "train/negative_loss": 1.1239439249038696, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 1.1295928955078125, - "train/total_loss": 0.6557775735855103 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.11896880716085434, - "train/contrastive_loss": 1.4289947748184204, - "train/negative_loss": 1.0481364727020264, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.38085827231407166, - "train/total_loss": 0.404767781496048 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.15212321281433105, - "train/contrastive_loss": 0.9163507223129272, - "train/negative_loss": 0.9036896824836731, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.012661050073802471, - "train/total_loss": 0.33539336919784546 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.3757459819316864, - "train/contrastive_loss": 2.738154411315918, - "train/negative_loss": 1.471732258796692, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.2664222717285156, - "train/total_loss": 0.9233769178390503 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.15081831812858582, - "train/contrastive_loss": 2.5618577003479004, - "train/negative_loss": 1.5394541025161743, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 1.022403597831726, - "train/total_loss": 0.6631898880004883 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.12339582294225693, - "train/contrastive_loss": 2.4571142196655273, - "train/negative_loss": 1.282004952430725, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 1.1751093864440918, - "train/total_loss": 0.6148186922073364 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.19941996037960052, - "train/contrastive_loss": 3.838411331176758, - "train/negative_loss": 1.7958935499191284, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 2.04251766204834, - "train/total_loss": 0.9671022295951843 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.0834556445479393, - "train/contrastive_loss": 2.146494150161743, - "train/negative_loss": 2.1464462280273438, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 4.8004603740992025e-05, - "train/total_loss": 0.512754499912262 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.11700427532196045, - "train/contrastive_loss": 1.9130001068115234, - "train/negative_loss": 0.6942372918128967, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.218762755393982, - "train/total_loss": 0.49960431456565857 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.13261473178863525, - "train/contrastive_loss": 0.49156510829925537, - "train/negative_loss": 0.4778570532798767, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.013708067126572132, - "train/total_loss": 0.23092776536941528 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.24762433767318726, - "train/contrastive_loss": 2.2400894165039062, - "train/negative_loss": 1.3662312030792236, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.8738583326339722, - "train/total_loss": 0.6956422328948975 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.18046945333480835, - "train/contrastive_loss": 1.0532780885696411, - "train/negative_loss": 0.3416849672794342, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.7115930914878845, - "train/total_loss": 0.3911250829696655 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.20235086977481842, - "train/contrastive_loss": 1.80985689163208, - "train/negative_loss": 1.243823766708374, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.5660331845283508, - "train/total_loss": 0.5643222332000732 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.11936695128679276, - "train/contrastive_loss": 1.0033936500549316, - "train/negative_loss": 0.4356115460395813, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.5677821636199951, - "train/total_loss": 0.32004567980766296 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.2483135461807251, - "train/contrastive_loss": 1.621165156364441, - "train/negative_loss": 0.21796564757823944, - "train/num_negatives": 44, - "train/num_positives": 10, - "train/positive_loss": 1.403199553489685, - "train/total_loss": 0.5725466012954712 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.2290140837430954, - "train/contrastive_loss": 1.7325589656829834, - "train/negative_loss": 0.7822895050048828, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 0.9502695202827454, - "train/total_loss": 0.5755258798599243 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.08455225080251694, - "train/contrastive_loss": 0.5525155067443848, - "train/negative_loss": 0.20650112628936768, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.3460143804550171, - "train/total_loss": 0.19505535066127777 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.16164834797382355, - "train/contrastive_loss": 0.4335736334323883, - "train/negative_loss": 0.3167395293712616, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.11683410406112671, - "train/total_loss": 0.24836307764053345 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.06375754624605179, - "train/contrastive_loss": 0.6654332876205444, - "train/negative_loss": 0.2647901177406311, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.4006431996822357, - "train/total_loss": 0.196844220161438 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.332409530878067, - "train/contrastive_loss": 1.4340050220489502, - "train/negative_loss": 0.2970395088195801, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.1369655132293701, - "train/total_loss": 0.6192105412483215 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.30402669310569763, - "train/contrastive_loss": 2.971123218536377, - "train/negative_loss": 1.6555379629135132, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.3155851364135742, - "train/total_loss": 0.8982512950897217 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.18367554247379303, - "train/contrastive_loss": 4.085911273956299, - "train/negative_loss": 3.1322691440582275, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.9536420106887817, - "train/total_loss": 1.0008578300476074 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.19229164719581604, - "train/contrastive_loss": 1.457464337348938, - "train/negative_loss": 0.8025166392326355, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.6549476981163025, - "train/total_loss": 0.4837845265865326 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.1951485127210617, - "train/contrastive_loss": 0.8098751306533813, - "train/negative_loss": 0.5058203935623169, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.30405470728874207, - "train/total_loss": 0.35712355375289917 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.09216257184743881, - "train/contrastive_loss": 0.5916066765785217, - "train/negative_loss": 0.19572892785072327, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.39587774872779846, - "train/total_loss": 0.21048390865325928 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.19125662744045258, - "train/contrastive_loss": 2.4058074951171875, - "train/negative_loss": 1.264951467514038, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.1408559083938599, - "train/total_loss": 0.6724181175231934 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.19430893659591675, - "train/contrastive_loss": 0.5473577976226807, - "train/negative_loss": 0.5473304986953735, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 2.7299300199956633e-05, - "train/total_loss": 0.3037804961204529 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.1591276079416275, - "train/contrastive_loss": 0.8403200507164001, - "train/negative_loss": 0.6964396238327026, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.1438804268836975, - "train/total_loss": 0.32719162106513977 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.21852077543735504, - "train/contrastive_loss": 3.6873373985290527, - "train/negative_loss": 2.7589073181152344, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.9284301996231079, - "train/total_loss": 0.9559882283210754 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.18816697597503662, - "train/contrastive_loss": 3.0830225944519043, - "train/negative_loss": 1.4033398628234863, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.6796826124191284, - "train/total_loss": 0.8047714829444885 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.10695578157901764, - "train/contrastive_loss": 0.5867024660110474, - "train/negative_loss": 0.4609006643295288, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.12580180168151855, - "train/total_loss": 0.22429627180099487 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.15092873573303223, - "train/contrastive_loss": 0.8782252073287964, - "train/negative_loss": 0.8782058954238892, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 1.9312092263135128e-05, - "train/total_loss": 0.32657378911972046 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.18800987303256989, - "train/contrastive_loss": 1.3189928531646729, - "train/negative_loss": 1.317729115486145, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.0012636814499273896, - "train/total_loss": 0.45180845260620117 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.20317016541957855, - "train/contrastive_loss": 2.3232100009918213, - "train/negative_loss": 2.322451114654541, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.0007589358137920499, - "train/total_loss": 0.667812168598175 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.16531087458133698, - "train/contrastive_loss": 1.2114291191101074, - "train/negative_loss": 0.9081498384475708, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.30327922105789185, - "train/total_loss": 0.4075967073440552 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.17659416794776917, - "train/contrastive_loss": 2.434370279312134, - "train/negative_loss": 1.8505276441574097, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.5838426351547241, - "train/total_loss": 0.6634682416915894 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.20540596544742584, - "train/contrastive_loss": 1.3956860303878784, - "train/negative_loss": 0.2798050343990326, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 1.1158809661865234, - "train/total_loss": 0.48454320430755615 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.16188974678516388, - "train/contrastive_loss": 2.179929256439209, - "train/negative_loss": 1.0740712881088257, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.1058579683303833, - "train/total_loss": 0.5978755950927734 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.11287809908390045, - "train/contrastive_loss": 0.8696467876434326, - "train/negative_loss": 0.4293334484100342, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.44031333923339844, - "train/total_loss": 0.28680747747421265 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.28814804553985596, - "train/contrastive_loss": 0.6101537942886353, - "train/negative_loss": 0.35342082381248474, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.2567330002784729, - "train/total_loss": 0.4101788103580475 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.10213731229305267, - "train/contrastive_loss": 0.7775403261184692, - "train/negative_loss": 0.7775377035140991, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 2.5928068225766765e-06, - "train/total_loss": 0.2576453685760498 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.10541747510433197, - "train/contrastive_loss": 0.7871649265289307, - "train/negative_loss": 0.16447070240974426, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.6226942539215088, - "train/total_loss": 0.26285046339035034 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.08775049448013306, - "train/contrastive_loss": 1.1143922805786133, - "train/negative_loss": 1.1091806888580322, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.005211647134274244, - "train/total_loss": 0.3106289505958557 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.15152643620967865, - "train/contrastive_loss": 0.8111494183540344, - "train/negative_loss": 0.6849755644798279, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.12617383897304535, - "train/total_loss": 0.3137563169002533 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.11847944557666779, - "train/contrastive_loss": 1.2870850563049316, - "train/negative_loss": 0.2884431481361389, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.998641848564148, - "train/total_loss": 0.3758964538574219 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.13356579840183258, - "train/contrastive_loss": 0.4443674087524414, - "train/negative_loss": 0.1728215366601944, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.2715458869934082, - "train/total_loss": 0.22243928909301758 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.19421212375164032, - "train/contrastive_loss": 0.8402777910232544, - "train/negative_loss": 0.5592202544212341, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.28105756640434265, - "train/total_loss": 0.3622676730155945 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.21190589666366577, - "train/contrastive_loss": 3.2864630222320557, - "train/negative_loss": 2.474865436553955, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.8115976452827454, - "train/total_loss": 0.8691985011100769 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.11110832542181015, - "train/contrastive_loss": 0.22732429206371307, - "train/negative_loss": 0.12762294709682465, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.09970134496688843, - "train/total_loss": 0.15657317638397217 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.16439379751682281, - "train/contrastive_loss": 2.5303072929382324, - "train/negative_loss": 1.6310787200927734, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.899228572845459, - "train/total_loss": 0.670455276966095 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.3074919581413269, - "train/contrastive_loss": 3.9899239540100098, - "train/negative_loss": 1.590984582901001, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 2.398939371109009, - "train/total_loss": 1.1054767370224 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.25087910890579224, - "train/contrastive_loss": 3.772274971008301, - "train/negative_loss": 1.7718003988265991, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 2.000474691390991, - "train/total_loss": 1.0053341388702393 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.14321136474609375, - "train/contrastive_loss": 1.7315396070480347, - "train/negative_loss": 1.5204880237579346, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.21105162799358368, - "train/total_loss": 0.48951929807662964 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.24586139619350433, - "train/contrastive_loss": 3.454685688018799, - "train/negative_loss": 1.6302616596221924, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.824424147605896, - "train/total_loss": 0.9367985725402832 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.2769038677215576, - "train/contrastive_loss": 5.26125431060791, - "train/negative_loss": 4.315311908721924, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.9459422826766968, - "train/total_loss": 1.3291547298431396 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.2980262339115143, - "train/contrastive_loss": 2.9018447399139404, - "train/negative_loss": 1.628287434577942, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.2735573053359985, - "train/total_loss": 0.8783951997756958 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.10505229979753494, - "train/contrastive_loss": 0.2664782404899597, - "train/negative_loss": 0.2664755582809448, - "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 2.6822144718607888e-06, - "train/total_loss": 0.158347949385643 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.18170668184757233, - "train/contrastive_loss": 1.5119987726211548, - "train/negative_loss": 0.8086231350898743, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.7033756375312805, - "train/total_loss": 0.4841064214706421 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.11351145803928375, - "train/contrastive_loss": 1.2525701522827148, - "train/negative_loss": 0.5797364115715027, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.6728338003158569, - "train/total_loss": 0.3640254735946655 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.16587917506694794, - "train/contrastive_loss": 1.536336064338684, - "train/negative_loss": 1.536336064338684, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.47314637899398804 - }, - { - "epoch": 17.870722433460077, - "eval_exact_match_accuracy": 0.36, - "eval_hamming_loss": 0.061512605042016805, - "eval_loss": 0.5351871848106384, - "eval_macro_f1": 0.4544672169542387, - "eval_macro_precision": 0.6235844712604802, - "eval_macro_recall": 0.3837451184492209, - "eval_micro_f1": 0.6361829025844931, - "eval_micro_precision": 0.7619047619047619, - "eval_micro_recall": 0.5460750853242321, - "eval_runtime": 2.6306, - "eval_samples_per_second": 199.573, - "eval_steps_per_second": 25.089, - "step": 4700 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.06918200850486755, - "train/contrastive_loss": 0.5445549488067627, - "train/negative_loss": 0.5442155003547668, - "train/num_negatives": 40, - "train/num_positives": 8, - "train/positive_loss": 0.0003394644008949399, - "train/total_loss": 0.17809300124645233 - }, - { - "epoch": 17.870722433460077, - "step": 4700, - "train/classification_loss": 0.07595794647932053, - "train/contrastive_loss": 0.208000048995018, - "train/negative_loss": 0.1672411412000656, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.040758904069662094, - "train/total_loss": 0.11755795776844025 - }, - { - "epoch": 18.06083650190114, - "grad_norm": 9.827784538269043, - "learning_rate": 1.9292846270928464e-05, - "loss": 0.3581, - "step": 4750 - }, - { - "epoch": 18.06083650190114, - "step": 4750, - "train/classification_loss": 0.034342601895332336, - "train/contrastive_loss": 0.30236372351646423, - "train/negative_loss": 0.2715160548686981, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.030847668647766113, - "train/total_loss": 0.09481534361839294 - }, - { - "epoch": 18.06083650190114, - "step": 4750, - "train/classification_loss": 0.035669438540935516, - "train/contrastive_loss": 0.2092803567647934, - "train/negative_loss": 0.207768052816391, - "train/num_negatives": 24, - "train/num_positives": 32, - "train/positive_loss": 0.001512301852926612, - "train/total_loss": 0.07752551138401031 - }, - { - "epoch": 18.250950570342205, - "grad_norm": 7.188684463500977, - "learning_rate": 1.9285235920852362e-05, - "loss": 0.3546, - "step": 4800 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.331603080034256, - "train/contrastive_loss": 2.6494905948638916, - "train/negative_loss": 0.6810959577560425, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.9683946371078491, - "train/total_loss": 0.8615012168884277 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.11761737614870071, - "train/contrastive_loss": 1.4812886714935303, - "train/negative_loss": 0.975277841091156, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.506010890007019, - "train/total_loss": 0.41387510299682617 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.17516569793224335, - "train/contrastive_loss": 1.5543181896209717, - "train/negative_loss": 0.7049735188484192, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.8493447303771973, - "train/total_loss": 0.48602932691574097 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.2265671044588089, - "train/contrastive_loss": 2.2886109352111816, - "train/negative_loss": 1.347399115562439, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.9412119388580322, - "train/total_loss": 0.684289276599884 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.10264694690704346, - "train/contrastive_loss": 1.5306949615478516, - "train/negative_loss": 1.1034092903137207, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.42728573083877563, - "train/total_loss": 0.40878593921661377 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.2011488974094391, - "train/contrastive_loss": 1.3580821752548218, - "train/negative_loss": 0.9365049600601196, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.42157718539237976, - "train/total_loss": 0.47276532649993896 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.21534714102745056, - "train/contrastive_loss": 2.5193991661071777, - "train/negative_loss": 0.9392468929290771, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 1.5801522731781006, - "train/total_loss": 0.7192269563674927 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.1195756122469902, - "train/contrastive_loss": 1.0080420970916748, - "train/negative_loss": 0.9733359217643738, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.03470619395375252, - "train/total_loss": 0.32118403911590576 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.16276182234287262, - "train/contrastive_loss": 2.666369676589966, - "train/negative_loss": 1.5120325088500977, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 1.1543371677398682, - "train/total_loss": 0.6960357427597046 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.33087265491485596, - "train/contrastive_loss": 3.2297720909118652, - "train/negative_loss": 1.4341272115707397, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.795644998550415, - "train/total_loss": 0.976827085018158 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.16463275253772736, - "train/contrastive_loss": 2.809701442718506, - "train/negative_loss": 1.6920044422149658, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 1.1176968812942505, - "train/total_loss": 0.7265730500221252 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.11630858480930328, - "train/contrastive_loss": 1.8506994247436523, - "train/negative_loss": 1.2618563175201416, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.588843047618866, - "train/total_loss": 0.4864484667778015 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.1825246512889862, - "train/contrastive_loss": 3.169342517852783, - "train/negative_loss": 1.9027804136276245, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.2665619850158691, - "train/total_loss": 0.8163931369781494 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.09905196726322174, - "train/contrastive_loss": 2.31846284866333, - "train/negative_loss": 2.317793130874634, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.0006696029449813068, - "train/total_loss": 0.5627445578575134 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.10598786920309067, - "train/contrastive_loss": 2.287867546081543, - "train/negative_loss": 0.8130369186401367, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.4748305082321167, - "train/total_loss": 0.5635613799095154 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.12754568457603455, - "train/contrastive_loss": 0.48062440752983093, - "train/negative_loss": 0.23615378141403198, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.24447062611579895, - "train/total_loss": 0.2236705720424652 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.24277964234352112, - "train/contrastive_loss": 1.996071696281433, - "train/negative_loss": 1.1698458194732666, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.8262258768081665, - "train/total_loss": 0.6419939994812012 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.20283447206020355, - "train/contrastive_loss": 1.950344204902649, - "train/negative_loss": 0.7129863500595093, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 1.2373578548431396, - "train/total_loss": 0.5929033160209656 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.20940160751342773, - "train/contrastive_loss": 1.9679789543151855, - "train/negative_loss": 1.58137047290802, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.3866085410118103, - "train/total_loss": 0.6029974222183228 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.11620332300662994, - "train/contrastive_loss": 1.4151098728179932, - "train/negative_loss": 0.21599271893501282, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.1991171836853027, - "train/total_loss": 0.39922529458999634 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.24620062112808228, - "train/contrastive_loss": 1.9143874645233154, - "train/negative_loss": 0.4137175977230072, - "train/num_negatives": 44, - "train/num_positives": 10, - "train/positive_loss": 1.5006698369979858, - "train/total_loss": 0.6290781497955322 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.24876606464385986, - "train/contrastive_loss": 2.818237781524658, - "train/negative_loss": 0.8961740136146545, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 1.9220637083053589, - "train/total_loss": 0.8124136328697205 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.10341156274080276, - "train/contrastive_loss": 1.3266563415527344, - "train/negative_loss": 0.7607670426368713, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.565889298915863, - "train/total_loss": 0.36874282360076904 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.1726466864347458, - "train/contrastive_loss": 1.1093937158584595, - "train/negative_loss": 0.44503721594810486, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.6643564701080322, - "train/total_loss": 0.3945254385471344 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.09586133062839508, - "train/contrastive_loss": 2.1205358505249023, - "train/negative_loss": 0.7768318057060242, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 1.3437039852142334, - "train/total_loss": 0.5199685096740723 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.3460414707660675, - "train/contrastive_loss": 1.7116007804870605, - "train/negative_loss": 0.4379314184188843, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.2736693620681763, - "train/total_loss": 0.688361644744873 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.266736775636673, - "train/contrastive_loss": 3.2290358543395996, - "train/negative_loss": 1.5748244524002075, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.6542112827301025, - "train/total_loss": 0.9125440120697021 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.21682992577552795, - "train/contrastive_loss": 4.319581031799316, - "train/negative_loss": 3.1854777336120605, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 1.1341032981872559, - "train/total_loss": 1.0807461738586426 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.2095957100391388, - "train/contrastive_loss": 1.4384862184524536, - "train/negative_loss": 0.8907774090766907, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.5477088093757629, - "train/total_loss": 0.49729296565055847 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.20714791119098663, - "train/contrastive_loss": 1.3822576999664307, - "train/negative_loss": 1.0548171997070312, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.327440470457077, - "train/total_loss": 0.4835994839668274 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.10279487818479538, - "train/contrastive_loss": 1.157896637916565, - "train/negative_loss": 0.3681011199951172, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.7897955179214478, - "train/total_loss": 0.33437421917915344 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.1965377777814865, - "train/contrastive_loss": 2.883314609527588, - "train/negative_loss": 1.5824668407440186, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.3008477687835693, - "train/total_loss": 0.7732007503509521 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.25175076723098755, - "train/contrastive_loss": 0.8984617590904236, - "train/negative_loss": 0.8984315991401672, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 3.0160405003698543e-05, - "train/total_loss": 0.43144312500953674 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.22946013510227203, - "train/contrastive_loss": 2.4730114936828613, - "train/negative_loss": 0.7119591236114502, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 1.7610524892807007, - "train/total_loss": 0.724062442779541 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.204443097114563, - "train/contrastive_loss": 3.1836695671081543, - "train/negative_loss": 2.8906233310699463, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.293046236038208, - "train/total_loss": 0.8411770462989807 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.17815837264060974, - "train/contrastive_loss": 2.8755199909210205, - "train/negative_loss": 1.1746509075164795, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.700869083404541, - "train/total_loss": 0.7532624006271362 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.12882770597934723, - "train/contrastive_loss": 0.8699408769607544, - "train/negative_loss": 0.7200595736503601, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.1498813033103943, - "train/total_loss": 0.30281588435173035 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.17469269037246704, - "train/contrastive_loss": 1.1553187370300293, - "train/negative_loss": 1.065568208694458, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.08975056558847427, - "train/total_loss": 0.4057564437389374 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.1692187488079071, - "train/contrastive_loss": 1.4497369527816772, - "train/negative_loss": 1.4488955736160278, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.0008413207251578569, - "train/total_loss": 0.45916613936424255 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.1888863444328308, - "train/contrastive_loss": 2.3610737323760986, - "train/negative_loss": 2.359647274017334, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.0014264022465795279, - "train/total_loss": 0.6611011028289795 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.18832927942276, - "train/contrastive_loss": 1.7278891801834106, - "train/negative_loss": 1.174952745437622, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.5529364347457886, - "train/total_loss": 0.5339071154594421 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.1984800398349762, - "train/contrastive_loss": 2.724940538406372, - "train/negative_loss": 1.8242511749267578, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.900689423084259, - "train/total_loss": 0.743468165397644 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.18091750144958496, - "train/contrastive_loss": 1.960049033164978, - "train/negative_loss": 0.6479500532150269, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 1.3120989799499512, - "train/total_loss": 0.5729273557662964 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.16417354345321655, - "train/contrastive_loss": 2.2806859016418457, - "train/negative_loss": 0.7725016474723816, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.5081841945648193, - "train/total_loss": 0.6203107237815857 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.12239538878202438, - "train/contrastive_loss": 1.0079987049102783, - "train/negative_loss": 0.40749722719192505, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.600501537322998, - "train/total_loss": 0.3239951431751251 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.2647177278995514, - "train/contrastive_loss": 0.7609004378318787, - "train/negative_loss": 0.5212830305099487, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.23961739242076874, - "train/total_loss": 0.41689783334732056 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.11213459074497223, - "train/contrastive_loss": 0.5322738289833069, - "train/negative_loss": 0.5322698950767517, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 3.933918378606904e-06, - "train/total_loss": 0.21858936548233032 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.11503460258245468, - "train/contrastive_loss": 1.3469616174697876, - "train/negative_loss": 0.17937710881233215, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.1675845384597778, - "train/total_loss": 0.38442695140838623 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.1105315238237381, - "train/contrastive_loss": 1.5244346857070923, - "train/negative_loss": 1.3878545761108398, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.13658013939857483, - "train/total_loss": 0.41541844606399536 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.1424514204263687, - "train/contrastive_loss": 0.6999379396438599, - "train/negative_loss": 0.3318024277687073, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.368135541677475, - "train/total_loss": 0.2824389934539795 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.13326725363731384, - "train/contrastive_loss": 1.8014345169067383, - "train/negative_loss": 0.48431432247161865, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.3171201944351196, - "train/total_loss": 0.49355417490005493 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.1405608355998993, - "train/contrastive_loss": 1.2068297863006592, - "train/negative_loss": 0.20051835477352142, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.0063114166259766, - "train/total_loss": 0.3819267749786377 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.1972188651561737, - "train/contrastive_loss": 1.574549913406372, - "train/negative_loss": 1.0711274147033691, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.5034224390983582, - "train/total_loss": 0.5121288299560547 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.22566618025302887, - "train/contrastive_loss": 3.774103879928589, - "train/negative_loss": 3.168553590774536, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.6055503487586975, - "train/total_loss": 0.9804869294166565 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.159120574593544, - "train/contrastive_loss": 0.8286087512969971, - "train/negative_loss": 0.2529771029949188, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.5756316781044006, - "train/total_loss": 0.32484233379364014 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.19141367077827454, - "train/contrastive_loss": 3.1404800415039062, - "train/negative_loss": 1.9630200862884521, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.1774600744247437, - "train/total_loss": 0.819509744644165 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.3041161596775055, - "train/contrastive_loss": 3.6459712982177734, - "train/negative_loss": 1.3934377431869507, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 2.2525336742401123, - "train/total_loss": 1.0333104133605957 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.22768399119377136, - "train/contrastive_loss": 3.71974515914917, - "train/negative_loss": 1.733988642692566, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.9857566356658936, - "train/total_loss": 0.9716330766677856 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.15558010339736938, - "train/contrastive_loss": 2.071721315383911, - "train/negative_loss": 2.047428846359253, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.0242923591285944, - "train/total_loss": 0.5699243545532227 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.2570647597312927, - "train/contrastive_loss": 3.706409454345703, - "train/negative_loss": 1.4432986974716187, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 2.263110876083374, - "train/total_loss": 0.9983466863632202 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.3193044066429138, - "train/contrastive_loss": 6.117128849029541, - "train/negative_loss": 4.703335762023926, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.4137929677963257, - "train/total_loss": 1.5427300930023193 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.30722397565841675, - "train/contrastive_loss": 3.423389434814453, - "train/negative_loss": 1.6459499597549438, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.7774394750595093, - "train/total_loss": 0.9919018745422363 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.12652988731861115, - "train/contrastive_loss": 0.4528260827064514, - "train/negative_loss": 0.45282143354415894, - "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 4.649180027627153e-06, - "train/total_loss": 0.21709510684013367 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.14958028495311737, - "train/contrastive_loss": 1.1057460308074951, - "train/negative_loss": 0.42565515637397766, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.6800909042358398, - "train/total_loss": 0.3707295060157776 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.11477527767419815, - "train/contrastive_loss": 1.561047077178955, - "train/negative_loss": 0.5410037040710449, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 1.0200433731079102, - "train/total_loss": 0.4269846975803375 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.15697722136974335, - "train/contrastive_loss": 1.724382996559143, - "train/negative_loss": 1.724382996559143, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5018538236618042 - }, - { - "epoch": 18.250950570342205, - "eval_exact_match_accuracy": 0.32, - "eval_hamming_loss": 0.06565826330532212, - "eval_loss": 0.597208559513092, - "eval_macro_f1": 0.43924226594799765, - "eval_macro_precision": 0.5357932658401842, - "eval_macro_recall": 0.3825267818914722, - "eval_micro_f1": 0.613965744400527, - "eval_micro_precision": 0.729264475743349, - "eval_micro_recall": 0.5301478953356087, - "eval_runtime": 2.6355, - "eval_samples_per_second": 199.203, - "eval_steps_per_second": 25.043, - "step": 4800 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.07149739563465118, - "train/contrastive_loss": 0.3636605739593506, - "train/negative_loss": 0.36347079277038574, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.00018977929721586406, - "train/total_loss": 0.14422950148582458 - }, - { - "epoch": 18.250950570342205, - "step": 4800, - "train/classification_loss": 0.0931914672255516, - "train/contrastive_loss": 1.1679373979568481, - "train/negative_loss": 0.6970142126083374, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.47092315554618835, - "train/total_loss": 0.32677894830703735 - }, - { - "epoch": 18.44106463878327, - "grad_norm": 8.384060859680176, - "learning_rate": 1.9277625570776257e-05, - "loss": 0.3733, - "step": 4850 - }, - { - "epoch": 18.44106463878327, - "step": 4850, - "train/classification_loss": 0.05661606788635254, - "train/contrastive_loss": 0.2872365117073059, - "train/negative_loss": 0.28247401118278503, - "train/num_negatives": 44, - "train/num_positives": 10, - "train/positive_loss": 0.004762495867908001, - "train/total_loss": 0.11406336724758148 - }, - { - "epoch": 18.44106463878327, - "step": 4850, - "train/classification_loss": 0.0841854140162468, - "train/contrastive_loss": 0.8428009152412415, - "train/negative_loss": 0.3719601333141327, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.47084078192710876, - "train/total_loss": 0.2527455985546112 - }, - { - "epoch": 18.631178707224336, - "grad_norm": 1.6756900548934937, - "learning_rate": 1.9270015220700155e-05, - "loss": 0.3363, - "step": 4900 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.38409215211868286, - "train/contrastive_loss": 3.3051066398620605, - "train/negative_loss": 0.8783417344093323, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 2.426764965057373, - "train/total_loss": 1.0451135635375977 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.13226594030857086, - "train/contrastive_loss": 1.4866046905517578, - "train/negative_loss": 0.9528505206108093, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.5337542295455933, - "train/total_loss": 0.42958688735961914 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.19825667142868042, - "train/contrastive_loss": 1.0154825448989868, - "train/negative_loss": 0.1078239306807518, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.907658576965332, - "train/total_loss": 0.4013531804084778 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.24957121908664703, - "train/contrastive_loss": 2.943563938140869, - "train/negative_loss": 1.6071940660476685, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.3363698720932007, - "train/total_loss": 0.8382840156555176 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.09042759239673615, - "train/contrastive_loss": 1.5586752891540527, - "train/negative_loss": 1.2689223289489746, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.2897529602050781, - "train/total_loss": 0.40216267108917236 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.2069336473941803, - "train/contrastive_loss": 1.7006258964538574, - "train/negative_loss": 1.1334284543991089, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.5671974420547485, - "train/total_loss": 0.5470588207244873 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.2594519257545471, - "train/contrastive_loss": 2.4397828578948975, - "train/negative_loss": 1.5729081630706787, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.8668747544288635, - "train/total_loss": 0.7474085092544556 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.12316692620515823, - "train/contrastive_loss": 0.8898402452468872, - "train/negative_loss": 0.8540713787078857, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.03576889634132385, - "train/total_loss": 0.30113497376441956 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.1570090651512146, - "train/contrastive_loss": 1.1151901483535767, - "train/negative_loss": 1.0985339879989624, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.016656123101711273, - "train/total_loss": 0.380047082901001 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.32549721002578735, - "train/contrastive_loss": 2.735520839691162, - "train/negative_loss": 1.260308861732483, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.4752120971679688, - "train/total_loss": 0.8726013898849487 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.15129950642585754, - "train/contrastive_loss": 2.268766403198242, - "train/negative_loss": 1.543207049369812, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.7255594730377197, - "train/total_loss": 0.6050528287887573 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.11724072694778442, - "train/contrastive_loss": 1.7187724113464355, - "train/negative_loss": 0.9036093950271606, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.8151630759239197, - "train/total_loss": 0.46099522709846497 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.15023350715637207, - "train/contrastive_loss": 2.089506149291992, - "train/negative_loss": 1.6780641078948975, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.4114419221878052, - "train/total_loss": 0.5681347846984863 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.10935751348733902, - "train/contrastive_loss": 2.6358447074890137, - "train/negative_loss": 2.6352412700653076, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.0006034901598468423, - "train/total_loss": 0.6365264654159546 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.08799659460783005, - "train/contrastive_loss": 1.7378325462341309, - "train/negative_loss": 0.5925837755203247, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.1452487707138062, - "train/total_loss": 0.4355631172657013 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.16216714680194855, - "train/contrastive_loss": 0.8297275304794312, - "train/negative_loss": 0.5642201900482178, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.26550737023353577, - "train/total_loss": 0.3281126618385315 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.25973355770111084, - "train/contrastive_loss": 2.243715286254883, - "train/negative_loss": 1.3399286270141602, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.9037867188453674, - "train/total_loss": 0.7084766626358032 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.18791459500789642, - "train/contrastive_loss": 1.3426663875579834, - "train/negative_loss": 0.6202796697616577, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.7223866581916809, - "train/total_loss": 0.45644789934158325 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.22071129083633423, - "train/contrastive_loss": 1.9495770931243896, - "train/negative_loss": 1.1545584201812744, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.7950186729431152, - "train/total_loss": 0.6106266975402832 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.14231224358081818, - "train/contrastive_loss": 1.2542569637298584, - "train/negative_loss": 0.19935786724090576, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.0548990964889526, - "train/total_loss": 0.39316362142562866 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.2452002912759781, - "train/contrastive_loss": 1.5560941696166992, - "train/negative_loss": 0.2691787779331207, - "train/num_negatives": 44, - "train/num_positives": 10, - "train/positive_loss": 1.2869154214859009, - "train/total_loss": 0.5564191341400146 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.23663529753684998, - "train/contrastive_loss": 1.3775486946105957, - "train/negative_loss": 0.925042986869812, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 0.45250576734542847, - "train/total_loss": 0.5121450424194336 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.07845362275838852, - "train/contrastive_loss": 0.7954543828964233, - "train/negative_loss": 0.4313206970691681, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.36413368582725525, - "train/total_loss": 0.23754450678825378 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.16561201214790344, - "train/contrastive_loss": 1.0189707279205322, - "train/negative_loss": 0.21655909717082977, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.802411675453186, - "train/total_loss": 0.36940616369247437 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.06853518635034561, - "train/contrastive_loss": 0.6282175779342651, - "train/negative_loss": 0.44593679904937744, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.1822807788848877, - "train/total_loss": 0.19417870044708252 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.34788262844085693, - "train/contrastive_loss": 1.3699886798858643, - "train/negative_loss": 0.3455556631088257, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.0244330167770386, - "train/total_loss": 0.6218804121017456 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.2764991819858551, - "train/contrastive_loss": 3.217503547668457, - "train/negative_loss": 1.773716688156128, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.4437869787216187, - "train/total_loss": 0.9199999570846558 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.20955877006053925, - "train/contrastive_loss": 3.302365303039551, - "train/negative_loss": 2.490429639816284, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.8119356036186218, - "train/total_loss": 0.8700318336486816 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.2171807736158371, - "train/contrastive_loss": 1.8037488460540771, - "train/negative_loss": 0.7823337912559509, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 1.0214149951934814, - "train/total_loss": 0.5779305696487427 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.176733136177063, - "train/contrastive_loss": 0.7041789293289185, - "train/negative_loss": 0.19657324254512787, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.5076056718826294, - "train/total_loss": 0.31756892800331116 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.09462030977010727, - "train/contrastive_loss": 1.31255304813385, - "train/negative_loss": 0.8331683278083801, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.47938475012779236, - "train/total_loss": 0.3571309447288513 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.1923033446073532, - "train/contrastive_loss": 2.929457902908325, - "train/negative_loss": 1.5708318948745728, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.3586260080337524, - "train/total_loss": 0.7781949639320374 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.25247204303741455, - "train/contrastive_loss": 0.772871196269989, - "train/negative_loss": 0.7726531028747559, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.00021811718761455268, - "train/total_loss": 0.40704628825187683 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.22146926820278168, - "train/contrastive_loss": 2.0676212310791016, - "train/negative_loss": 1.2929590940475464, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.7746620178222656, - "train/total_loss": 0.6349934935569763 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.21380868554115295, - "train/contrastive_loss": 2.9455060958862305, - "train/negative_loss": 2.581827163696289, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.3636789917945862, - "train/total_loss": 0.8029099702835083 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.18483966588974, - "train/contrastive_loss": 3.2915163040161133, - "train/negative_loss": 1.368869423866272, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.9226469993591309, - "train/total_loss": 0.8431429266929626 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.12599043548107147, - "train/contrastive_loss": 1.1470346450805664, - "train/negative_loss": 0.8504186272621155, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.2966160178184509, - "train/total_loss": 0.35539737343788147 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.14913268387317657, - "train/contrastive_loss": 0.8000763654708862, - "train/negative_loss": 0.8000510931015015, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 2.527268952690065e-05, - "train/total_loss": 0.3091479539871216 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.20327459275722504, - "train/contrastive_loss": 1.5472869873046875, - "train/negative_loss": 1.4924263954162598, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.05486058443784714, - "train/total_loss": 0.5127319693565369 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.20968754589557648, - "train/contrastive_loss": 2.962769031524658, - "train/negative_loss": 2.962587594985962, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.00018151261610910296, - "train/total_loss": 0.802241325378418 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.18618284165859222, - "train/contrastive_loss": 1.5515432357788086, - "train/negative_loss": 0.8168392777442932, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.7347039580345154, - "train/total_loss": 0.4964914917945862 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.14554883539676666, - "train/contrastive_loss": 2.075991630554199, - "train/negative_loss": 1.7718762159347534, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.30411529541015625, - "train/total_loss": 0.5607471466064453 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.1801607757806778, - "train/contrastive_loss": 1.901669979095459, - "train/negative_loss": 0.3942953944206238, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 1.5073745250701904, - "train/total_loss": 0.5604947805404663 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.16870692372322083, - "train/contrastive_loss": 2.829515218734741, - "train/negative_loss": 0.8600296378135681, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.9694855213165283, - "train/total_loss": 0.7346099615097046 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.11372324824333191, - "train/contrastive_loss": 0.5547425150871277, - "train/negative_loss": 0.1917402595281601, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.3630022704601288, - "train/total_loss": 0.22467175126075745 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.26039785146713257, - "train/contrastive_loss": 0.6836889982223511, - "train/negative_loss": 0.5185375213623047, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.16515150666236877, - "train/total_loss": 0.3971356749534607 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.10368897020816803, - "train/contrastive_loss": 0.8504205942153931, - "train/negative_loss": 0.850415825843811, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 4.7385860852955375e-06, - "train/total_loss": 0.27377307415008545 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.12556582689285278, - "train/contrastive_loss": 1.308447003364563, - "train/negative_loss": 0.46630313992500305, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.8421438932418823, - "train/total_loss": 0.3872552216053009 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.10201260447502136, - "train/contrastive_loss": 1.3234342336654663, - "train/negative_loss": 1.1558152437210083, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.1676190197467804, - "train/total_loss": 0.3666994571685791 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.1663467139005661, - "train/contrastive_loss": 1.7351765632629395, - "train/negative_loss": 0.8425161242485046, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.8926604986190796, - "train/total_loss": 0.5133820176124573 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.13315506279468536, - "train/contrastive_loss": 1.9594765901565552, - "train/negative_loss": 0.7074275016784668, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.2520490884780884, - "train/total_loss": 0.5250504016876221 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.16647471487522125, - "train/contrastive_loss": 1.093421459197998, - "train/negative_loss": 0.351399302482605, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.7420222163200378, - "train/total_loss": 0.3851590156555176 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.22389748692512512, - "train/contrastive_loss": 1.3595372438430786, - "train/negative_loss": 0.7120992541313171, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.6474379897117615, - "train/total_loss": 0.49580493569374084 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.22418680787086487, - "train/contrastive_loss": 4.034985065460205, - "train/negative_loss": 3.1817445755004883, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.8532403111457825, - "train/total_loss": 1.0311838388442993 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.1837569624185562, - "train/contrastive_loss": 0.8700655698776245, - "train/negative_loss": 0.2784993350505829, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.591566264629364, - "train/total_loss": 0.35777008533477783 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.19098150730133057, - "train/contrastive_loss": 2.9631621837615967, - "train/negative_loss": 1.949090838432312, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.0140713453292847, - "train/total_loss": 0.7836139798164368 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.3054370880126953, - "train/contrastive_loss": 3.860166072845459, - "train/negative_loss": 1.7680999040603638, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 2.0920662879943848, - "train/total_loss": 1.077470302581787 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.260538250207901, - "train/contrastive_loss": 3.305543899536133, - "train/negative_loss": 1.84992253780365, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.4556214809417725, - "train/total_loss": 0.9216470718383789 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.16031259298324585, - "train/contrastive_loss": 2.6334595680236816, - "train/negative_loss": 1.9775406122207642, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.6559188365936279, - "train/total_loss": 0.6870045065879822 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.24214540421962738, - "train/contrastive_loss": 3.084965229034424, - "train/negative_loss": 1.3877253532409668, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.697239875793457, - "train/total_loss": 0.8591384887695312 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.32436472177505493, - "train/contrastive_loss": 5.102682590484619, - "train/negative_loss": 4.1288533210754395, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.9738292694091797, - "train/total_loss": 1.3449013233184814 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.3246716856956482, - "train/contrastive_loss": 2.9801456928253174, - "train/negative_loss": 1.7301511764526367, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.2499945163726807, - "train/total_loss": 0.9207008481025696 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.140066996216774, - "train/contrastive_loss": 0.5571708679199219, - "train/negative_loss": 0.5568914413452148, - "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.0002794150204863399, - "train/total_loss": 0.2515011727809906 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.15304380655288696, - "train/contrastive_loss": 1.0120625495910645, - "train/negative_loss": 0.1963101029396057, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.815752387046814, - "train/total_loss": 0.35545632243156433 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.11709165573120117, - "train/contrastive_loss": 1.408087134361267, - "train/negative_loss": 0.4998573362827301, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.9082297682762146, - "train/total_loss": 0.39870908856391907 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.20291131734848022, - "train/contrastive_loss": 1.573814034461975, - "train/negative_loss": 1.573814034461975, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5176740884780884 - }, - { - "epoch": 18.631178707224336, - "eval_exact_match_accuracy": 0.33714285714285713, - "eval_hamming_loss": 0.06543417366946779, - "eval_loss": 0.5696276426315308, - "eval_macro_f1": 0.43341613821133007, - "eval_macro_precision": 0.6056686146947458, - "eval_macro_recall": 0.36430280191674336, - "eval_micro_f1": 0.6080536912751678, - "eval_micro_precision": 0.7414075286415712, - "eval_micro_recall": 0.515358361774744, - "eval_runtime": 2.6391, - "eval_samples_per_second": 198.934, - "eval_steps_per_second": 25.009, - "step": 4900 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.12065351754426956, - "train/contrastive_loss": 0.13385656476020813, - "train/negative_loss": 0.13090626895427704, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.0029502969700843096, - "train/total_loss": 0.1474248319864273 - }, - { - "epoch": 18.631178707224336, - "step": 4900, - "train/classification_loss": 0.07092077285051346, - "train/contrastive_loss": 0.22800198197364807, - "train/negative_loss": 0.20906810462474823, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 0.018933869898319244, - "train/total_loss": 0.11652116477489471 - }, - { - "epoch": 18.8212927756654, - "grad_norm": 4.045762538909912, - "learning_rate": 1.926240487062405e-05, - "loss": 0.3388, - "step": 4950 - }, - { - "epoch": 18.8212927756654, - "step": 4950, - "train/classification_loss": 0.10891631245613098, - "train/contrastive_loss": 0.5788666009902954, - "train/negative_loss": 0.07912429422140121, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.4997422993183136, - "train/total_loss": 0.22468963265419006 - }, - { - "epoch": 18.8212927756654, - "step": 4950, - "train/classification_loss": 0.06006965413689613, - "train/contrastive_loss": 0.49980199337005615, - "train/negative_loss": 0.2172553390264511, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.28254663944244385, - "train/total_loss": 0.1600300520658493 - }, - { - "epoch": 19.011406844106464, - "grad_norm": 6.631872177124023, - "learning_rate": 1.9254794520547944e-05, - "loss": 0.3344, - "step": 5000 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.3516407012939453, - "train/contrastive_loss": 2.8592889308929443, - "train/negative_loss": 1.8361667394638062, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.0231221914291382, - "train/total_loss": 0.9234985113143921 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.1165451630949974, - "train/contrastive_loss": 1.0654938220977783, - "train/negative_loss": 0.6505488157272339, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.41494494676589966, - "train/total_loss": 0.32964393496513367 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.22438736259937286, - "train/contrastive_loss": 1.458052396774292, - "train/negative_loss": 0.269084632396698, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.1889677047729492, - "train/total_loss": 0.5159978270530701 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.30204376578330994, - "train/contrastive_loss": 3.45542573928833, - "train/negative_loss": 2.3005690574645996, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.1548566818237305, - "train/total_loss": 0.9931288957595825 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.12378210574388504, - "train/contrastive_loss": 1.781229019165039, - "train/negative_loss": 1.1059647798538208, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.6752642393112183, - "train/total_loss": 0.4800279140472412 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.22779859602451324, - "train/contrastive_loss": 2.45253849029541, - "train/negative_loss": 1.4290469884872437, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 1.023491621017456, - "train/total_loss": 0.718306303024292 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.25702646374702454, - "train/contrastive_loss": 3.2177159786224365, - "train/negative_loss": 1.841691493988037, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 1.3760244846343994, - "train/total_loss": 0.9005696773529053 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.17715869843959808, - "train/contrastive_loss": 1.973620891571045, - "train/negative_loss": 1.56857430934906, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.4050465524196625, - "train/total_loss": 0.5718829035758972 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.18477115035057068, - "train/contrastive_loss": 2.513078451156616, - "train/negative_loss": 1.529137372970581, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.9839410781860352, - "train/total_loss": 0.6873868703842163 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.28026941418647766, - "train/contrastive_loss": 2.7949154376983643, - "train/negative_loss": 1.9314900636672974, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.8634253144264221, - "train/total_loss": 0.8392524719238281 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.17325127124786377, - "train/contrastive_loss": 2.243016242980957, - "train/negative_loss": 1.6338739395141602, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.6091424226760864, - "train/total_loss": 0.6218545436859131 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.13500185310840607, - "train/contrastive_loss": 2.7524569034576416, - "train/negative_loss": 1.2563393115997314, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 1.4961175918579102, - "train/total_loss": 0.6854932308197021 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.15344908833503723, - "train/contrastive_loss": 3.0950801372528076, - "train/negative_loss": 1.6504778861999512, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.4446022510528564, - "train/total_loss": 0.7724651098251343 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.0842185840010643, - "train/contrastive_loss": 1.6382472515106201, - "train/negative_loss": 1.6378620862960815, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.0003851776709780097, - "train/total_loss": 0.41186803579330444 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.08658070117235184, - "train/contrastive_loss": 1.5901274681091309, - "train/negative_loss": 0.5260459780693054, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.0640814304351807, - "train/total_loss": 0.4046061933040619 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.16730442643165588, - "train/contrastive_loss": 1.988673210144043, - "train/negative_loss": 0.8517283797264099, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 1.1369447708129883, - "train/total_loss": 0.5650390386581421 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.2646237015724182, - "train/contrastive_loss": 1.666684627532959, - "train/negative_loss": 1.006531000137329, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.6601536870002747, - "train/total_loss": 0.5979605913162231 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.20833104848861694, - "train/contrastive_loss": 1.6457819938659668, - "train/negative_loss": 0.7469335198402405, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.8988484144210815, - "train/total_loss": 0.5374874472618103 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.20563043653964996, - "train/contrastive_loss": 0.9478499889373779, - "train/negative_loss": 0.8972486257553101, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.05060138925909996, - "train/total_loss": 0.3952004313468933 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.1350526213645935, - "train/contrastive_loss": 0.5865288376808167, - "train/negative_loss": 0.17623074352741241, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.41029807925224304, - "train/total_loss": 0.2523583769798279 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.20629911124706268, - "train/contrastive_loss": 1.5724763870239258, - "train/negative_loss": 0.2040473371744156, - "train/num_negatives": 44, - "train/num_positives": 10, - "train/positive_loss": 1.3684290647506714, - "train/total_loss": 0.5207943916320801 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.22182372212409973, - "train/contrastive_loss": 1.6953296661376953, - "train/negative_loss": 1.2015963792800903, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 0.4937332570552826, - "train/total_loss": 0.5608896613121033 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.10547708719968796, - "train/contrastive_loss": 1.135160207748413, - "train/negative_loss": 0.2322371006011963, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.9029231071472168, - "train/total_loss": 0.3325091302394867 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.17046909034252167, - "train/contrastive_loss": 0.598738968372345, - "train/negative_loss": 0.4110839068889618, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.18765507638454437, - "train/total_loss": 0.2902168929576874 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.10916648060083389, - "train/contrastive_loss": 1.991458535194397, - "train/negative_loss": 0.515156626701355, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 1.476301908493042, - "train/total_loss": 0.5074582099914551 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.37656304240226746, - "train/contrastive_loss": 1.9633184671401978, - "train/negative_loss": 0.8328806161880493, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.1304378509521484, - "train/total_loss": 0.7692267298698425 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.2883675992488861, - "train/contrastive_loss": 2.9357688426971436, - "train/negative_loss": 1.407473087310791, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.5282957553863525, - "train/total_loss": 0.8755214214324951 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.24775803089141846, - "train/contrastive_loss": 4.148109436035156, - "train/negative_loss": 2.7852118015289307, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 1.3628973960876465, - "train/total_loss": 1.0773799419403076 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.20035028457641602, - "train/contrastive_loss": 1.750627040863037, - "train/negative_loss": 0.8332614302635193, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.9173656702041626, - "train/total_loss": 0.5504757165908813 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.20482127368450165, - "train/contrastive_loss": 1.346954345703125, - "train/negative_loss": 1.2867419719696045, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.060212355107069016, - "train/total_loss": 0.4742121696472168 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.09604935348033905, - "train/contrastive_loss": 1.5359387397766113, - "train/negative_loss": 1.0004146099090576, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.5355241298675537, - "train/total_loss": 0.40323710441589355 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.22871704399585724, - "train/contrastive_loss": 1.7241913080215454, - "train/negative_loss": 1.0290513038635254, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.69514000415802, - "train/total_loss": 0.5735552906990051 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.22213789820671082, - "train/contrastive_loss": 0.7944575548171997, - "train/negative_loss": 0.7866762280464172, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.007781303022056818, - "train/total_loss": 0.3810294270515442 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.2278968244791031, - "train/contrastive_loss": 1.3110227584838867, - "train/negative_loss": 0.6494556069374084, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.6615671515464783, - "train/total_loss": 0.4901013970375061 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.17688676714897156, - "train/contrastive_loss": 2.2769014835357666, - "train/negative_loss": 1.8922940492630005, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.38460734486579895, - "train/total_loss": 0.6322670578956604 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.17643260955810547, - "train/contrastive_loss": 3.3899927139282227, - "train/negative_loss": 1.3734283447265625, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 2.01656436920166, - "train/total_loss": 0.85443115234375 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.13014589250087738, - "train/contrastive_loss": 1.6855827569961548, - "train/negative_loss": 1.1843578815460205, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.5012248754501343, - "train/total_loss": 0.4672624468803406 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.18326237797737122, - "train/contrastive_loss": 0.7855522036552429, - "train/negative_loss": 0.7842586636543274, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.0012935417471453547, - "train/total_loss": 0.34037280082702637 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.19307972490787506, - "train/contrastive_loss": 1.18247389793396, - "train/negative_loss": 0.9061206579208374, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.27635326981544495, - "train/total_loss": 0.42957448959350586 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.1673821657896042, - "train/contrastive_loss": 1.9970266819000244, - "train/negative_loss": 1.9969236850738525, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.00010300213034497574, - "train/total_loss": 0.5667874813079834 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.17857159674167633, - "train/contrastive_loss": 1.139397382736206, - "train/negative_loss": 0.750109851360321, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.389287531375885, - "train/total_loss": 0.4064510762691498 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.2148527204990387, - "train/contrastive_loss": 2.0440211296081543, - "train/negative_loss": 1.4633852243423462, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.5806359052658081, - "train/total_loss": 0.6236569881439209 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.19486847519874573, - "train/contrastive_loss": 1.7963638305664062, - "train/negative_loss": 0.3964255154132843, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 1.3999383449554443, - "train/total_loss": 0.5541412830352783 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.18719039857387543, - "train/contrastive_loss": 2.7530205249786377, - "train/negative_loss": 0.9825562834739685, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.7704641819000244, - "train/total_loss": 0.7377945184707642 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.1633107215166092, - "train/contrastive_loss": 1.467667579650879, - "train/negative_loss": 0.798516571521759, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.6691509485244751, - "train/total_loss": 0.4568442702293396 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.23625649511814117, - "train/contrastive_loss": 0.6562273502349854, - "train/negative_loss": 0.605872392654419, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.05035495385527611, - "train/total_loss": 0.36750197410583496 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.11674932390451431, - "train/contrastive_loss": 0.7404046058654785, - "train/negative_loss": 0.6169583797454834, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.12344621121883392, - "train/total_loss": 0.26483026146888733 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.1293659508228302, - "train/contrastive_loss": 1.4970064163208008, - "train/negative_loss": 0.2274194061756134, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.2695870399475098, - "train/total_loss": 0.42876723408699036 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.09113286435604095, - "train/contrastive_loss": 1.261164903640747, - "train/negative_loss": 1.0886900424957275, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.1724749058485031, - "train/total_loss": 0.3433658480644226 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.15919797122478485, - "train/contrastive_loss": 0.8560980558395386, - "train/negative_loss": 0.2140226662158966, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.6420754194259644, - "train/total_loss": 0.33041757345199585 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.16043870151042938, - "train/contrastive_loss": 2.3157782554626465, - "train/negative_loss": 0.6482589244842529, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.6675193309783936, - "train/total_loss": 0.623594343662262 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.1665107011795044, - "train/contrastive_loss": 1.4511775970458984, - "train/negative_loss": 0.44313329458236694, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.0080442428588867, - "train/total_loss": 0.4567462205886841 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.22651854157447815, - "train/contrastive_loss": 1.9404492378234863, - "train/negative_loss": 1.018746018409729, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.9217032194137573, - "train/total_loss": 0.6146084070205688 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.2429175078868866, - "train/contrastive_loss": 3.59804368019104, - "train/negative_loss": 2.6141581535339355, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.9838854670524597, - "train/total_loss": 0.9625262022018433 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.18345658481121063, - "train/contrastive_loss": 1.4633859395980835, - "train/negative_loss": 0.3913284242153168, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 1.0720574855804443, - "train/total_loss": 0.4761337637901306 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.21223090589046478, - "train/contrastive_loss": 3.1898303031921387, - "train/negative_loss": 2.410352945327759, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.7794772982597351, - "train/total_loss": 0.8501970171928406 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.3192982077598572, - "train/contrastive_loss": 3.9914443492889404, - "train/negative_loss": 1.85394287109375, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 2.1375014781951904, - "train/total_loss": 1.1175870895385742 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.2670833170413971, - "train/contrastive_loss": 3.4713821411132812, - "train/negative_loss": 1.8384325504302979, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.6329495906829834, - "train/total_loss": 0.9613597393035889 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.17855772376060486, - "train/contrastive_loss": 2.1565463542938232, - "train/negative_loss": 1.399830937385559, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.7567154765129089, - "train/total_loss": 0.6098669767379761 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.24300581216812134, - "train/contrastive_loss": 4.175110816955566, - "train/negative_loss": 1.7504757642745972, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 2.4246349334716797, - "train/total_loss": 1.0780279636383057 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.31568410992622375, - "train/contrastive_loss": 2.9845447540283203, - "train/negative_loss": 1.9251869916915894, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.0593578815460205, - "train/total_loss": 0.9125931262969971 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.33571699261665344, - "train/contrastive_loss": 3.060267210006714, - "train/negative_loss": 1.7666120529174805, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.2936551570892334, - "train/total_loss": 0.9477704763412476 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.14385531842708588, - "train/contrastive_loss": 0.6475963592529297, - "train/negative_loss": 0.6464225053787231, - "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.0011738582979887724, - "train/total_loss": 0.2733745872974396 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.1801847517490387, - "train/contrastive_loss": 1.8012726306915283, - "train/negative_loss": 1.0239167213439941, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.777355968952179, - "train/total_loss": 0.540439248085022 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.1193602904677391, - "train/contrastive_loss": 0.8846020102500916, - "train/negative_loss": 0.32093530893325806, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.5636667013168335, - "train/total_loss": 0.2962806820869446 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.2049509584903717, - "train/contrastive_loss": 1.761587381362915, - "train/negative_loss": 1.761587381362915, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5572684407234192 - }, - { - "epoch": 19.011406844106464, - "eval_exact_match_accuracy": 0.3028571428571429, - "eval_hamming_loss": 0.0684593837535014, - "eval_loss": 0.5925257205963135, - "eval_macro_f1": 0.4548080220813918, - "eval_macro_precision": 0.6128483046085954, - "eval_macro_recall": 0.3819020136578391, - "eval_micro_f1": 0.5863236289776574, - "eval_micro_precision": 0.7240802675585284, - "eval_micro_recall": 0.4926052332195677, - "eval_runtime": 2.6391, - "eval_samples_per_second": 198.93, - "eval_steps_per_second": 25.008, - "step": 5000 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.07001924514770508, - "train/contrastive_loss": 0.45223018527030945, - "train/negative_loss": 0.4474566876888275, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.004773502703756094, - "train/total_loss": 0.1604652851819992 - }, - { - "epoch": 19.011406844106464, - "step": 5000, - "train/classification_loss": 0.1049448773264885, - "train/contrastive_loss": 0.9611953496932983, - "train/negative_loss": 0.7069152593612671, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.25428009033203125, - "train/total_loss": 0.29718396067619324 - }, - { - "epoch": 19.20152091254753, - "grad_norm": 9.053022384643555, - "learning_rate": 1.9247184170471846e-05, - "loss": 0.3044, - "step": 5050 - }, - { - "epoch": 19.20152091254753, - "step": 5050, - "train/classification_loss": 0.06491824239492416, - "train/contrastive_loss": 0.7314701676368713, - "train/negative_loss": 0.7299368381500244, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.0015333382179960608, - "train/total_loss": 0.21121227741241455 - }, - { - "epoch": 19.20152091254753, - "step": 5050, - "train/classification_loss": 0.08453147858381271, - "train/contrastive_loss": 0.6660484075546265, - "train/negative_loss": 0.6650282740592957, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.0010201274417340755, - "train/total_loss": 0.21774116158485413 - }, - { - "epoch": 19.39163498098859, - "grad_norm": 5.277036190032959, - "learning_rate": 1.923957382039574e-05, - "loss": 0.3148, - "step": 5100 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.3698623776435852, - "train/contrastive_loss": 2.6759262084960938, - "train/negative_loss": 0.7692548632621765, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 1.9066712856292725, - "train/total_loss": 0.9050476551055908 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.10393465310335159, - "train/contrastive_loss": 1.4043611288070679, - "train/negative_loss": 0.831790566444397, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.5725705623626709, - "train/total_loss": 0.38480687141418457 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.19396303594112396, - "train/contrastive_loss": 1.8987939357757568, - "train/negative_loss": 0.8665583729743958, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 1.0322355031967163, - "train/total_loss": 0.5737218260765076 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.28149011731147766, - "train/contrastive_loss": 5.094486236572266, - "train/negative_loss": 4.120715618133545, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 0.9737703800201416, - "train/total_loss": 1.3003873825073242 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.10420398414134979, - "train/contrastive_loss": 0.9526112675666809, - "train/negative_loss": 0.8404656648635864, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.11214561015367508, - "train/total_loss": 0.29472625255584717 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.18230314552783966, - "train/contrastive_loss": 2.2218265533447266, - "train/negative_loss": 1.4188237190246582, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.8030028343200684, - "train/total_loss": 0.6266684532165527 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.18679599463939667, - "train/contrastive_loss": 1.2578719854354858, - "train/negative_loss": 0.9185248017311096, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.3393471837043762, - "train/total_loss": 0.43837040662765503 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.14052383601665497, - "train/contrastive_loss": 1.123228907585144, - "train/negative_loss": 0.9359996318817139, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.18722930550575256, - "train/total_loss": 0.36516961455345154 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.1376192718744278, - "train/contrastive_loss": 1.1049070358276367, - "train/negative_loss": 1.0997581481933594, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.005148882046341896, - "train/total_loss": 0.3586006760597229 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.346784383058548, - "train/contrastive_loss": 3.2339320182800293, - "train/negative_loss": 1.4288676977157593, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.8050642013549805, - "train/total_loss": 0.9935708045959473 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.15326015651226044, - "train/contrastive_loss": 2.320387363433838, - "train/negative_loss": 1.6063400506973267, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.7140474319458008, - "train/total_loss": 0.6173376441001892 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.10113024711608887, - "train/contrastive_loss": 1.3319952487945557, - "train/negative_loss": 0.6322072148323059, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.699787974357605, - "train/total_loss": 0.3675293028354645 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.17560745775699615, - "train/contrastive_loss": 2.9526939392089844, - "train/negative_loss": 2.390446186065674, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.5622477531433105, - "train/total_loss": 0.7661462426185608 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.09586081653833389, - "train/contrastive_loss": 2.374415874481201, - "train/negative_loss": 2.373868703842163, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.0005471670883707702, - "train/total_loss": 0.570743978023529 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.1003912165760994, - "train/contrastive_loss": 2.180673122406006, - "train/negative_loss": 0.7473078370094299, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.4333652257919312, - "train/total_loss": 0.5365258455276489 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.12923046946525574, - "train/contrastive_loss": 0.6791248321533203, - "train/negative_loss": 0.42090681195259094, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.25821802020072937, - "train/total_loss": 0.26505541801452637 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.25079816579818726, - "train/contrastive_loss": 2.837977647781372, - "train/negative_loss": 1.9737743139266968, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.8642033338546753, - "train/total_loss": 0.8183937072753906 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.17149528861045837, - "train/contrastive_loss": 0.9064697027206421, - "train/negative_loss": 0.34605878591537476, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.5604109168052673, - "train/total_loss": 0.3527892231941223 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.2093166708946228, - "train/contrastive_loss": 1.4458942413330078, - "train/negative_loss": 0.9565778374671936, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.489316463470459, - "train/total_loss": 0.49849551916122437 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.12715847790241241, - "train/contrastive_loss": 1.9157135486602783, - "train/negative_loss": 0.40784135460853577, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.507872223854065, - "train/total_loss": 0.5103011727333069 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.21916015446186066, - "train/contrastive_loss": 1.6026209592819214, - "train/negative_loss": 0.19360707700252533, - "train/num_negatives": 44, - "train/num_positives": 10, - "train/positive_loss": 1.4090138673782349, - "train/total_loss": 0.5396843552589417 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.22333799302577972, - "train/contrastive_loss": 2.050232410430908, - "train/negative_loss": 1.0622599124908447, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 0.9879724979400635, - "train/total_loss": 0.6333844661712646 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.07895489037036896, - "train/contrastive_loss": 1.271514654159546, - "train/negative_loss": 0.9567714929580688, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.31474316120147705, - "train/total_loss": 0.33325785398483276 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.15753883123397827, - "train/contrastive_loss": 0.40570539236068726, - "train/negative_loss": 0.2792322039604187, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.12647318840026855, - "train/total_loss": 0.2386799156665802 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.075721874833107, - "train/contrastive_loss": 0.8724719882011414, - "train/negative_loss": 0.39109331369400024, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.4813786745071411, - "train/total_loss": 0.2502162754535675 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.3413824439048767, - "train/contrastive_loss": 2.209663152694702, - "train/negative_loss": 0.815055787563324, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 1.3946073055267334, - "train/total_loss": 0.7833150625228882 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.3058488070964813, - "train/contrastive_loss": 2.8725008964538574, - "train/negative_loss": 1.474735975265503, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.3977649211883545, - "train/total_loss": 0.8803490400314331 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.2247866541147232, - "train/contrastive_loss": 4.765553951263428, - "train/negative_loss": 3.3824691772460938, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 1.383084774017334, - "train/total_loss": 1.1778974533081055 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.20482195913791656, - "train/contrastive_loss": 1.2297031879425049, - "train/negative_loss": 0.7280491590499878, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.5016540288925171, - "train/total_loss": 0.4507625997066498 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.20148077607154846, - "train/contrastive_loss": 0.9316743016242981, - "train/negative_loss": 0.5076207518577576, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.4240535497665405, - "train/total_loss": 0.3878156542778015 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.10963578522205353, - "train/contrastive_loss": 1.0138810873031616, - "train/negative_loss": 0.300618439912796, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.7132626175880432, - "train/total_loss": 0.3124120235443115 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.2112964540719986, - "train/contrastive_loss": 2.7759504318237305, - "train/negative_loss": 1.3096113204956055, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.466339111328125, - "train/total_loss": 0.7664865255355835 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.24035952985286713, - "train/contrastive_loss": 0.9000216722488403, - "train/negative_loss": 0.8999444246292114, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 7.725060277152807e-05, - "train/total_loss": 0.4203638732433319 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.19315248727798462, - "train/contrastive_loss": 1.8279398679733276, - "train/negative_loss": 0.8039673566818237, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 1.023972511291504, - "train/total_loss": 0.558740496635437 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.20331992208957672, - "train/contrastive_loss": 3.1230015754699707, - "train/negative_loss": 2.6322884559631348, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.49071305990219116, - "train/total_loss": 0.8279202580451965 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.1773516684770584, - "train/contrastive_loss": 3.366360664367676, - "train/negative_loss": 1.3633431196212769, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 2.0030174255371094, - "train/total_loss": 0.8506237864494324 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.1420053243637085, - "train/contrastive_loss": 1.612426519393921, - "train/negative_loss": 0.9641430974006653, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.6482833623886108, - "train/total_loss": 0.4644906222820282 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.170328751206398, - "train/contrastive_loss": 1.5592455863952637, - "train/negative_loss": 0.9382426142692566, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.6210030317306519, - "train/total_loss": 0.48217785358428955 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.19212493300437927, - "train/contrastive_loss": 1.2758110761642456, - "train/negative_loss": 1.2463244199752808, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.029486600309610367, - "train/total_loss": 0.4472871422767639 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.1890140175819397, - "train/contrastive_loss": 2.2275404930114746, - "train/negative_loss": 2.2272112369537354, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.0003293102781753987, - "train/total_loss": 0.6345220804214478 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.2121141105890274, - "train/contrastive_loss": 2.337057590484619, - "train/negative_loss": 1.2556827068328857, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.0813748836517334, - "train/total_loss": 0.67952561378479 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.12232281267642975, - "train/contrastive_loss": 1.017864465713501, - "train/negative_loss": 0.8443743586540222, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.17349016666412354, - "train/total_loss": 0.3258957266807556 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.18604333698749542, - "train/contrastive_loss": 2.141390085220337, - "train/negative_loss": 0.31810492277145386, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 1.8232851028442383, - "train/total_loss": 0.6143213510513306 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.18216831982135773, - "train/contrastive_loss": 2.305811643600464, - "train/negative_loss": 0.817948043346405, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.487863540649414, - "train/total_loss": 0.6433306336402893 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.10920170694589615, - "train/contrastive_loss": 0.7275854349136353, - "train/negative_loss": 0.23968468606472015, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.4879007637500763, - "train/total_loss": 0.2547188103199005 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.276057630777359, - "train/contrastive_loss": 1.3045639991760254, - "train/negative_loss": 0.7614874243736267, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.5430766344070435, - "train/total_loss": 0.5369704365730286 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.12319669872522354, - "train/contrastive_loss": 0.9882625341415405, - "train/negative_loss": 0.9882609844207764, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.519920033388189e-06, - "train/total_loss": 0.32084921002388 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.11485397070646286, - "train/contrastive_loss": 1.0735572576522827, - "train/negative_loss": 0.1874774694442749, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 0.8860797882080078, - "train/total_loss": 0.3295654356479645 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.1141357421875, - "train/contrastive_loss": 1.4314152002334595, - "train/negative_loss": 1.239830493927002, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.19158469140529633, - "train/total_loss": 0.40041878819465637 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.13311076164245605, - "train/contrastive_loss": 1.2811287641525269, - "train/negative_loss": 1.2645262479782104, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.01660247892141342, - "train/total_loss": 0.3893365263938904 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.1483631730079651, - "train/contrastive_loss": 2.382749080657959, - "train/negative_loss": 0.9488394856452942, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.43390953540802, - "train/total_loss": 0.6249129772186279 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.15227176249027252, - "train/contrastive_loss": 0.3508017063140869, - "train/negative_loss": 0.2281552106142044, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.12264649569988251, - "train/total_loss": 0.22243210673332214 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.19560956954956055, - "train/contrastive_loss": 1.5553505420684814, - "train/negative_loss": 0.7946575880050659, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.7606930136680603, - "train/total_loss": 0.5066796541213989 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.21954160928726196, - "train/contrastive_loss": 3.3688101768493652, - "train/negative_loss": 3.036153793334961, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.3326563835144043, - "train/total_loss": 0.893303632736206 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.10490699112415314, - "train/contrastive_loss": 0.16357746720314026, - "train/negative_loss": 0.14898227155208588, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.01459519099444151, - "train/total_loss": 0.13762249052524567 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.2197791486978531, - "train/contrastive_loss": 2.902954578399658, - "train/negative_loss": 2.140805959701538, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.7621486186981201, - "train/total_loss": 0.8003700375556946 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.31193792819976807, - "train/contrastive_loss": 4.510496616363525, - "train/negative_loss": 1.5290666818618774, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 2.9814300537109375, - "train/total_loss": 1.2140371799468994 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.2548889219760895, - "train/contrastive_loss": 2.6819310188293457, - "train/negative_loss": 1.4962453842163086, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.185685634613037, - "train/total_loss": 0.791275143623352 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.1781868040561676, - "train/contrastive_loss": 3.2525482177734375, - "train/negative_loss": 3.1017394065856934, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.1508088856935501, - "train/total_loss": 0.8286964893341064 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.3030659258365631, - "train/contrastive_loss": 3.7897889614105225, - "train/negative_loss": 1.5232772827148438, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 2.2665116786956787, - "train/total_loss": 1.0610237121582031 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.3409271538257599, - "train/contrastive_loss": 6.211893081665039, - "train/negative_loss": 4.911285877227783, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 1.3006070852279663, - "train/total_loss": 1.5833057165145874 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.35973450541496277, - "train/contrastive_loss": 3.7620949745178223, - "train/negative_loss": 1.9103055000305176, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.8517894744873047, - "train/total_loss": 1.1121535301208496 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.14231440424919128, - "train/contrastive_loss": 0.6412686705589294, - "train/negative_loss": 0.6411524415016174, - "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 0.00011621267913142219, - "train/total_loss": 0.2705681324005127 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.14932604134082794, - "train/contrastive_loss": 0.9865167737007141, - "train/negative_loss": 0.16664361953735352, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.8198731541633606, - "train/total_loss": 0.34662938117980957 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.11440487205982208, - "train/contrastive_loss": 1.4588556289672852, - "train/negative_loss": 0.4864273965358734, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.9724282622337341, - "train/total_loss": 0.40617603063583374 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.23159873485565186, - "train/contrastive_loss": 1.8787498474121094, - "train/negative_loss": 1.8787498474121094, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.6073486804962158 - }, - { - "epoch": 19.39163498098859, - "eval_exact_match_accuracy": 0.34285714285714286, - "eval_hamming_loss": 0.06442577030812324, - "eval_loss": 0.5890817046165466, - "eval_macro_f1": 0.4574985391985109, - "eval_macro_precision": 0.5458362162788296, - "eval_macro_recall": 0.40255674700187605, - "eval_micro_f1": 0.6263807667316439, - "eval_micro_precision": 0.7303030303030303, - "eval_micro_recall": 0.5483503981797497, - "eval_runtime": 2.6385, - "eval_samples_per_second": 198.973, - "eval_steps_per_second": 25.014, - "step": 5100 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.06601797789335251, - "train/contrastive_loss": 0.2431696057319641, - "train/negative_loss": 0.24171310663223267, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.0014564929297193885, - "train/total_loss": 0.11465190351009369 - }, - { - "epoch": 19.39163498098859, - "step": 5100, - "train/classification_loss": 0.06403198838233948, - "train/contrastive_loss": 0.16218844056129456, - "train/negative_loss": 0.16084949672222137, - "train/num_negatives": 40, - "train/num_positives": 12, - "train/positive_loss": 0.0013389450032263994, - "train/total_loss": 0.09646967798471451 - }, - { - "epoch": 19.581749049429657, - "grad_norm": 5.913722038269043, - "learning_rate": 1.9231963470319635e-05, - "loss": 0.3157, - "step": 5150 - }, - { - "epoch": 19.581749049429657, - "step": 5150, - "train/classification_loss": 0.1581401228904724, - "train/contrastive_loss": 1.0865373611450195, - "train/negative_loss": 0.4952530860900879, - "train/num_negatives": 36, - "train/num_positives": 6, - "train/positive_loss": 0.5912842750549316, - "train/total_loss": 0.3754476010799408 - }, - { - "epoch": 19.581749049429657, - "step": 5150, - "train/classification_loss": 0.05957839637994766, - "train/contrastive_loss": 0.17918917536735535, - "train/negative_loss": 0.1789633184671402, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.0002258641761727631, - "train/total_loss": 0.09541623294353485 - }, - { - "epoch": 19.771863117870723, - "grad_norm": 7.050843715667725, - "learning_rate": 1.9224353120243533e-05, - "loss": 0.3474, - "step": 5200 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.38127702474594116, - "train/contrastive_loss": 2.8317301273345947, - "train/negative_loss": 0.673801839351654, - "train/num_negatives": 28, - "train/num_positives": 14, - "train/positive_loss": 2.157928228378296, - "train/total_loss": 0.947623074054718 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.13723628222942352, - "train/contrastive_loss": 1.4218244552612305, - "train/negative_loss": 0.8191949725151062, - "train/num_negatives": 38, - "train/num_positives": 14, - "train/positive_loss": 0.6026294231414795, - "train/total_loss": 0.42160117626190186 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.18887247145175934, - "train/contrastive_loss": 1.5046167373657227, - "train/negative_loss": 0.5821987390518188, - "train/num_negatives": 30, - "train/num_positives": 22, - "train/positive_loss": 0.9224179983139038, - "train/total_loss": 0.4897958040237427 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.24681077897548676, - "train/contrastive_loss": 2.8054347038269043, - "train/negative_loss": 1.5432003736495972, - "train/num_negatives": 34, - "train/num_positives": 18, - "train/positive_loss": 1.2622342109680176, - "train/total_loss": 0.8078977465629578 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.08479398488998413, - "train/contrastive_loss": 1.5166633129119873, - "train/negative_loss": 1.2479357719421387, - "train/num_negatives": 18, - "train/num_positives": 26, - "train/positive_loss": 0.2687276005744934, - "train/total_loss": 0.3881266415119171 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.20703189074993134, - "train/contrastive_loss": 1.7857131958007812, - "train/negative_loss": 1.321738362312317, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.46397486329078674, - "train/total_loss": 0.5641745328903198 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.19493426382541656, - "train/contrastive_loss": 2.599797487258911, - "train/negative_loss": 1.7355132102966309, - "train/num_negatives": 42, - "train/num_positives": 8, - "train/positive_loss": 0.8642842173576355, - "train/total_loss": 0.7148937582969666 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.1491476446390152, - "train/contrastive_loss": 0.9527331590652466, - "train/negative_loss": 0.6921647787094116, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.2605683505535126, - "train/total_loss": 0.3396942615509033 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.13796234130859375, - "train/contrastive_loss": 1.0169799327850342, - "train/negative_loss": 1.011488676071167, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 0.005491302348673344, - "train/total_loss": 0.34135833382606506 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.3676392734050751, - "train/contrastive_loss": 3.004791021347046, - "train/negative_loss": 1.6633069515228271, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.3414840698242188, - "train/total_loss": 0.9685975313186646 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.16941159963607788, - "train/contrastive_loss": 2.5106496810913086, - "train/negative_loss": 1.623809814453125, - "train/num_negatives": 40, - "train/num_positives": 16, - "train/positive_loss": 0.8868399858474731, - "train/total_loss": 0.6715415716171265 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.10129193961620331, - "train/contrastive_loss": 1.4281657934188843, - "train/negative_loss": 0.4144417345523834, - "train/num_negatives": 44, - "train/num_positives": 12, - "train/positive_loss": 1.0137240886688232, - "train/total_loss": 0.3869251012802124 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.23469053208827972, - "train/contrastive_loss": 2.7812581062316895, - "train/negative_loss": 1.780656099319458, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 1.000601887702942, - "train/total_loss": 0.7909421920776367 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.08199139684438705, - "train/contrastive_loss": 2.1383068561553955, - "train/negative_loss": 2.1381425857543945, - "train/num_negatives": 36, - "train/num_positives": 16, - "train/positive_loss": 0.00016415378195233643, - "train/total_loss": 0.5096527934074402 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.10232949256896973, - "train/contrastive_loss": 1.7119238376617432, - "train/negative_loss": 1.0523786544799805, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 0.6595451235771179, - "train/total_loss": 0.4447142779827118 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.16575588285923004, - "train/contrastive_loss": 0.8818964958190918, - "train/negative_loss": 0.6012705564498901, - "train/num_negatives": 42, - "train/num_positives": 10, - "train/positive_loss": 0.2806259095668793, - "train/total_loss": 0.3421351909637451 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.2440429925918579, - "train/contrastive_loss": 2.1688828468322754, - "train/negative_loss": 1.068967580795288, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.0999152660369873, - "train/total_loss": 0.6778196096420288 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.18377596139907837, - "train/contrastive_loss": 1.1754786968231201, - "train/negative_loss": 0.3431337773799896, - "train/num_negatives": 32, - "train/num_positives": 16, - "train/positive_loss": 0.8323449492454529, - "train/total_loss": 0.4188717007637024 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.20056022703647614, - "train/contrastive_loss": 1.397731065750122, - "train/negative_loss": 0.9591307640075684, - "train/num_negatives": 44, - "train/num_positives": 6, - "train/positive_loss": 0.4386003613471985, - "train/total_loss": 0.4801064729690552 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.1167166605591774, - "train/contrastive_loss": 1.4150052070617676, - "train/negative_loss": 1.3631443977355957, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 0.05186082050204277, - "train/total_loss": 0.39971768856048584 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.21452808380126953, - "train/contrastive_loss": 1.4901407957077026, - "train/negative_loss": 0.28379368782043457, - "train/num_negatives": 44, - "train/num_positives": 10, - "train/positive_loss": 1.206347107887268, - "train/total_loss": 0.512556254863739 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.20542076230049133, - "train/contrastive_loss": 1.6336544752120972, - "train/negative_loss": 0.98520427942276, - "train/num_negatives": 44, - "train/num_positives": 8, - "train/positive_loss": 0.6484501957893372, - "train/total_loss": 0.5321516990661621 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.07951901853084564, - "train/contrastive_loss": 1.0222444534301758, - "train/negative_loss": 0.39424216747283936, - "train/num_negatives": 32, - "train/num_positives": 24, - "train/positive_loss": 0.6280022263526917, - "train/total_loss": 0.28396791219711304 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.15316890180110931, - "train/contrastive_loss": 0.23588962852954865, - "train/negative_loss": 0.2330215573310852, - "train/num_negatives": 34, - "train/num_positives": 20, - "train/positive_loss": 0.0028680660761892796, - "train/total_loss": 0.20034682750701904 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.07186581194400787, - "train/contrastive_loss": 0.7526023387908936, - "train/negative_loss": 0.46662360429763794, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.285978764295578, - "train/total_loss": 0.22238628566265106 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.33328238129615784, - "train/contrastive_loss": 1.106252670288086, - "train/negative_loss": 0.10670841485261917, - "train/num_negatives": 14, - "train/num_positives": 24, - "train/positive_loss": 0.9995442628860474, - "train/total_loss": 0.5545328855514526 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.28357329964637756, - "train/contrastive_loss": 2.592824935913086, - "train/negative_loss": 1.3111975193023682, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 1.2816275358200073, - "train/total_loss": 0.8021383285522461 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.20957691967487335, - "train/contrastive_loss": 3.5395078659057617, - "train/negative_loss": 2.8116941452026367, - "train/num_negatives": 34, - "train/num_positives": 16, - "train/positive_loss": 0.7278137803077698, - "train/total_loss": 0.9174785017967224 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.25006917119026184, - "train/contrastive_loss": 2.2770726680755615, - "train/negative_loss": 0.9018885493278503, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 1.3751840591430664, - "train/total_loss": 0.7054836750030518 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.21985496580600739, - "train/contrastive_loss": 1.2137991189956665, - "train/negative_loss": 1.1689221858978271, - "train/num_negatives": 30, - "train/num_positives": 16, - "train/positive_loss": 0.04487690329551697, - "train/total_loss": 0.4626147747039795 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.08212298899888992, - "train/contrastive_loss": 0.7507438659667969, - "train/negative_loss": 0.5931333303451538, - "train/num_negatives": 32, - "train/num_positives": 18, - "train/positive_loss": 0.15761050581932068, - "train/total_loss": 0.23227176070213318 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.20729754865169525, - "train/contrastive_loss": 2.813957691192627, - "train/negative_loss": 1.7435202598571777, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.0704374313354492, - "train/total_loss": 0.7700890898704529 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.2545546591281891, - "train/contrastive_loss": 0.7796552181243896, - "train/negative_loss": 0.77924644947052, - "train/num_negatives": 50, - "train/num_positives": 2, - "train/positive_loss": 0.0004087926063220948, - "train/total_loss": 0.4104856848716736 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.1561874896287918, - "train/contrastive_loss": 0.6810390949249268, - "train/negative_loss": 0.6791176199913025, - "train/num_negatives": 38, - "train/num_positives": 12, - "train/positive_loss": 0.0019215010106563568, - "train/total_loss": 0.29239529371261597 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.20472605526447296, - "train/contrastive_loss": 3.69364070892334, - "train/negative_loss": 2.804802656173706, - "train/num_negatives": 52, - "train/num_positives": 4, - "train/positive_loss": 0.8888381123542786, - "train/total_loss": 0.9434542059898376 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.20216096937656403, - "train/contrastive_loss": 3.2280125617980957, - "train/negative_loss": 1.513316035270691, - "train/num_negatives": 50, - "train/num_positives": 4, - "train/positive_loss": 1.7146966457366943, - "train/total_loss": 0.8477634787559509 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.15020757913589478, - "train/contrastive_loss": 1.4511749744415283, - "train/negative_loss": 0.6382017135620117, - "train/num_negatives": 22, - "train/num_positives": 28, - "train/positive_loss": 0.8129732608795166, - "train/total_loss": 0.44044259190559387 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.1441897302865982, - "train/contrastive_loss": 1.0039244890213013, - "train/negative_loss": 0.9898579120635986, - "train/num_negatives": 54, - "train/num_positives": 2, - "train/positive_loss": 0.014066582545638084, - "train/total_loss": 0.3449746370315552 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.22099320590496063, - "train/contrastive_loss": 1.4509962797164917, - "train/negative_loss": 1.1877567768096924, - "train/num_negatives": 46, - "train/num_positives": 8, - "train/positive_loss": 0.2632395029067993, - "train/total_loss": 0.5111924409866333 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.19294436275959015, - "train/contrastive_loss": 2.8929829597473145, - "train/negative_loss": 2.8928375244140625, - "train/num_negatives": 46, - "train/num_positives": 2, - "train/positive_loss": 0.00014532668865285814, - "train/total_loss": 0.7715409398078918 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.14958779513835907, - "train/contrastive_loss": 1.2318429946899414, - "train/negative_loss": 0.9010266661643982, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.330816388130188, - "train/total_loss": 0.3959563970565796 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.16028200089931488, - "train/contrastive_loss": 2.162405490875244, - "train/negative_loss": 1.864552617073059, - "train/num_negatives": 36, - "train/num_positives": 18, - "train/positive_loss": 0.29785284399986267, - "train/total_loss": 0.5927631258964539 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.1668495237827301, - "train/contrastive_loss": 1.9806408882141113, - "train/negative_loss": 0.40435096621513367, - "train/num_negatives": 42, - "train/num_positives": 12, - "train/positive_loss": 1.5762898921966553, - "train/total_loss": 0.56297767162323 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.17662976682186127, - "train/contrastive_loss": 1.5506794452667236, - "train/negative_loss": 0.6417889595031738, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 0.9088905453681946, - "train/total_loss": 0.48676568269729614 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.15040795505046844, - "train/contrastive_loss": 1.8176974058151245, - "train/negative_loss": 0.6878343820571899, - "train/num_negatives": 40, - "train/num_positives": 14, - "train/positive_loss": 1.1298630237579346, - "train/total_loss": 0.5139474272727966 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.27257877588272095, - "train/contrastive_loss": 0.9601985216140747, - "train/negative_loss": 0.581061065196991, - "train/num_negatives": 48, - "train/num_positives": 6, - "train/positive_loss": 0.37913745641708374, - "train/total_loss": 0.4646185040473938 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.12818415462970734, - "train/contrastive_loss": 1.0063809156417847, - "train/negative_loss": 1.0063761472702026, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 4.798192549060332e-06, - "train/total_loss": 0.3294603228569031 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.14363479614257812, - "train/contrastive_loss": 1.4797769784927368, - "train/negative_loss": 0.13739828765392303, - "train/num_negatives": 38, - "train/num_positives": 16, - "train/positive_loss": 1.3423787355422974, - "train/total_loss": 0.439590185880661 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.07325965911149979, - "train/contrastive_loss": 0.8241481184959412, - "train/negative_loss": 0.8237775564193726, - "train/num_negatives": 30, - "train/num_positives": 20, - "train/positive_loss": 0.00037055189022794366, - "train/total_loss": 0.23808929324150085 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.13937658071517944, - "train/contrastive_loss": 0.8849582076072693, - "train/negative_loss": 0.8803173303604126, - "train/num_negatives": 28, - "train/num_positives": 12, - "train/positive_loss": 0.004640848375856876, - "train/total_loss": 0.3163682222366333 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.15975762903690338, - "train/contrastive_loss": 1.9268800020217896, - "train/negative_loss": 0.8545734882354736, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 1.072306513786316, - "train/total_loss": 0.545133650302887 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.1412896066904068, - "train/contrastive_loss": 0.5322701930999756, - "train/negative_loss": 0.2074510008096695, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.3248192071914673, - "train/total_loss": 0.2477436363697052 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.1911468505859375, - "train/contrastive_loss": 2.0196194648742676, - "train/negative_loss": 1.2818200588226318, - "train/num_negatives": 42, - "train/num_positives": 14, - "train/positive_loss": 0.7377994656562805, - "train/total_loss": 0.5950707197189331 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.21257223188877106, - "train/contrastive_loss": 3.061587333679199, - "train/negative_loss": 2.004246234893799, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 1.05734121799469, - "train/total_loss": 0.8248897194862366 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.1259741485118866, - "train/contrastive_loss": 1.1490893363952637, - "train/negative_loss": 0.19774097204208374, - "train/num_negatives": 40, - "train/num_positives": 10, - "train/positive_loss": 0.9513483047485352, - "train/total_loss": 0.35579201579093933 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.1917337030172348, - "train/contrastive_loss": 2.6345772743225098, - "train/negative_loss": 1.8099431991577148, - "train/num_negatives": 50, - "train/num_positives": 6, - "train/positive_loss": 0.8246341943740845, - "train/total_loss": 0.7186492085456848 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.3333616554737091, - "train/contrastive_loss": 3.9554309844970703, - "train/negative_loss": 1.692263126373291, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 2.2631678581237793, - "train/total_loss": 1.1244478225708008 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.2629888653755188, - "train/contrastive_loss": 2.9074599742889404, - "train/negative_loss": 1.4084110260009766, - "train/num_negatives": 48, - "train/num_positives": 8, - "train/positive_loss": 1.4990489482879639, - "train/total_loss": 0.8444808721542358 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.16768909990787506, - "train/contrastive_loss": 1.1091651916503906, - "train/negative_loss": 0.902595579624176, - "train/num_negatives": 34, - "train/num_positives": 22, - "train/positive_loss": 0.206569641828537, - "train/total_loss": 0.38952213525772095 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.24312318861484528, - "train/contrastive_loss": 3.0809624195098877, - "train/negative_loss": 1.4020813703536987, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.678881049156189, - "train/total_loss": 0.8593156933784485 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.27698802947998047, - "train/contrastive_loss": 3.670548439025879, - "train/negative_loss": 2.9659416675567627, - "train/num_negatives": 16, - "train/num_positives": 22, - "train/positive_loss": 0.704606831073761, - "train/total_loss": 1.0110976696014404 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.3381383717060089, - "train/contrastive_loss": 2.9802634716033936, - "train/negative_loss": 1.7496527433395386, - "train/num_negatives": 46, - "train/num_positives": 10, - "train/positive_loss": 1.230610728263855, - "train/total_loss": 0.934191107749939 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.1089669018983841, - "train/contrastive_loss": 0.18735912442207336, - "train/negative_loss": 0.18735823035240173, - "train/num_negatives": 48, - "train/num_positives": 4, - "train/positive_loss": 8.940701263782103e-07, - "train/total_loss": 0.14643873274326324 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.2013651728630066, - "train/contrastive_loss": 1.3569034337997437, - "train/negative_loss": 0.8839617371559143, - "train/num_negatives": 38, - "train/num_positives": 18, - "train/positive_loss": 0.47294172644615173, - "train/total_loss": 0.4727458655834198 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.11356393247842789, - "train/contrastive_loss": 1.4718523025512695, - "train/negative_loss": 0.5226961970329285, - "train/num_negatives": 46, - "train/num_positives": 6, - "train/positive_loss": 0.9491561651229858, - "train/total_loss": 0.40793439745903015 - }, - { - "epoch": 19.771863117870723, - "step": 5200, - "train/classification_loss": 0.2094537615776062, - "train/contrastive_loss": 1.7808104753494263, - "train/negative_loss": 1.7808104753494263, - "train/num_negatives": 18, - "train/num_positives": 0, - "train/positive_loss": 0.0, - "train/total_loss": 0.5656158924102783 - }, - { - "epoch": 19.771863117870723, - "eval_exact_match_accuracy": 0.36, - "eval_hamming_loss": 0.06352941176470588, - "eval_loss": 0.5491193532943726, - "eval_macro_f1": 0.46019892965671766, - "eval_macro_precision": 0.5561144645801837, - "eval_macro_recall": 0.40349396101515433, - "eval_micro_f1": 0.6339573918657199, - "eval_micro_precision": 0.7328358208955223, - "eval_micro_recall": 0.558589306029579, - "eval_runtime": 2.6312, - "eval_samples_per_second": 199.526, - "eval_steps_per_second": 25.083, - "step": 5200 - }, - { - "epoch": 19.771863117870723, - "step": 5200, + "epoch": 11.971830985915492, + "step": 3400, "total_flos": 0.0, - "train_loss": 0.7332356544641349, - "train_runtime": 1473.3753, - "train_samples_per_second": 1426.317, - "train_steps_per_second": 89.251 + "train_loss": 0.9307791737949147, + "train_runtime": 983.1644, + "train_samples_per_second": 2307.854, + "train_steps_per_second": 144.432 } ], "logging_steps": 50, - "max_steps": 131500, + "max_steps": 142000, "num_input_tokens_seen": 0, "num_train_epochs": 500, "save_steps": 2000,