Upload 42_add_dilation_loss_for_token_logits_43's state dict
Browse files- .gitattributes +1 -0
- 42_add_dilation_loss_for_token_logits_43/lasts/42_add_dilation_loss_for_token_logits_43_s26092004_f0_last_ema.pth +3 -0
- 42_add_dilation_loss_for_token_logits_43/logs/42_add_dilation_loss_for_token_logits_43_log_plot.jpg +3 -0
- 42_add_dilation_loss_for_token_logits_43/logs/42_add_dilation_loss_for_token_logits_43_s26092004_f0_logging.json +1 -0
- 42_add_dilation_loss_for_token_logits_43/r1s/42_add_dilation_loss_for_token_logits_43_s26092004_f0_r1_vs0.46430_ema.pth +3 -0
- 42_add_dilation_loss_for_token_logits_43/results/42_add_dilation_loss_for_token_logits_43_test.json +86 -0
.gitattributes
CHANGED
|
@@ -72,3 +72,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 72 |
35_40_negs_40/logs/35_40_negs_40_log_plot.jpg filter=lfs diff=lfs merge=lfs -text
|
| 73 |
41_remove_retrieval_from_tokens_42/logs/41_remove_retrieval_from_tokens_42_log_plot.jpg filter=lfs diff=lfs merge=lfs -text
|
| 74 |
37_30_41/logs/37_30_41_log_plot.jpg filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 72 |
35_40_negs_40/logs/35_40_negs_40_log_plot.jpg filter=lfs diff=lfs merge=lfs -text
|
| 73 |
41_remove_retrieval_from_tokens_42/logs/41_remove_retrieval_from_tokens_42_log_plot.jpg filter=lfs diff=lfs merge=lfs -text
|
| 74 |
37_30_41/logs/37_30_41_log_plot.jpg filter=lfs diff=lfs merge=lfs -text
|
| 75 |
+
42_add_dilation_loss_for_token_logits_43/logs/42_add_dilation_loss_for_token_logits_43_log_plot.jpg filter=lfs diff=lfs merge=lfs -text
|
42_add_dilation_loss_for_token_logits_43/lasts/42_add_dilation_loss_for_token_logits_43_s26092004_f0_last_ema.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:15d5797a4231e9d7106949a9e2c7afd063246c401927bf040115a40d4628d87f
|
| 3 |
+
size 584836960
|
42_add_dilation_loss_for_token_logits_43/logs/42_add_dilation_loss_for_token_logits_43_log_plot.jpg
ADDED
|
Git LFS Details
|
42_add_dilation_loss_for_token_logits_43/logs/42_add_dilation_loss_for_token_logits_43_s26092004_f0_logging.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"1": {"lr": [2e-05, 0.0005], "train_loss": 1.7462430000305176, "total": 1.7462429470486112, "token_bce": 0.2636160843460648, "token_smooth": 0.5109800437644676, "dilation": 0.32428349247685184, "span_contrastive": 0.7043267144097223, "span_triplet": 0.42962962962962964, "span_ce": 0.18889912923177082}, "2": {"lr": [1.988303923565381e-05, 0.0004969282409784868], "train_loss": 1.3336777687072754, "total": 1.3336777524594907, "token_bce": 0.20739935980902777, "token_smooth": 0.49858036747685186, "dilation": 0.2600263129340278, "span_contrastive": 0.5221408872251158, "span_triplet": 0.31703703703703706, "span_ce": 0.13495302553530092}, "3": {"lr": [1.9535036904803962e-05, 0.0004877886008156408], "train_loss": 1.2032934427261353, "total": 1.20329345703125, "token_bce": 0.19491963704427084, "token_smooth": 0.48699634693287036, "dilation": 0.2444973415798611, "span_contrastive": 0.45727909794560184, "span_triplet": 0.27574074074074073, "span_ce": 0.11956885443793402}, "4": {"lr": [1.8964561979789496e-05, 0.00047280612778499774], "train_loss": 1.0944128036499023, "total": 1.094412796585648, "token_bce": 0.18452086272063078, "token_smooth": 0.47530024775752316, "dilation": 0.23218505859375, "span_contrastive": 0.4013004105179398, "span_triplet": 0.2424074074074074, "span_ce": 0.10804502133969908}, "5": {"lr": [1.8185661446562005e-05, 0.00045234974009654937], "train_loss": 1.0207452774047852, "total": 1.0207452618634258, "token_bce": 0.17528016266999422, "token_smooth": 0.47418773509837964, "dilation": 0.22174784342447917, "span_contrastive": 0.3678669117115162, "span_triplet": 0.22018518518518518, "span_ce": 0.09872957582826968}, "6": {"lr": [1.7217514421272206e-05, 0.00042692314190604356], "train_loss": 0.9484228491783142, "total": 0.9484228515625, "token_bce": 0.166716229474103, "token_smooth": 0.4774904152199074, "dilation": 0.2118576614945023, "span_contrastive": 0.33283130787037035, "span_triplet": 0.19518518518518518, "span_ce": 0.09134540134006076}, "7": {"lr": [1.60839598967785e-05, 0.00039715242044697206], "train_loss": 0.8921521306037903, "total": 0.8921521448206019, "token_bce": 0.15747964364510994, "token_smooth": 0.4827188675491898, "dilation": 0.20180858470775462, "span_contrastive": 0.3075924117476852, "span_triplet": 0.1827777777777778, "span_ce": 0.08592472782841436}, "8": {"lr": [1.4812909747525698e-05, 0.00036377062968501693], "train_loss": 0.8299175500869751, "total": 0.8299175347222222, "token_bce": 0.1489540269639757, "token_smooth": 0.4829901801215278, "dilation": 0.19281021683304397, "span_contrastive": 0.27897951479311345, "span_triplet": 0.16268518518518518, "span_ce": 0.0792928625036169, "val_score": 0.42744371676604714, "best_score": 0.42744371676604714, "new_best_model": true, "precision@3": 0.1965177048101333, "recall@3": 0.530418325304959, "f1@3": 0.28670349083856006, "precision_soft@3": 0.2929707713555161, "recall_soft@3": 0.7908875396317571, "f1_soft@3": 0.42744371676604714}, "9": {"lr": [1.3435661446562005e-05, 0.0003275997400965494], "train_loss": 0.776001513004303, "total": 0.7760015190972223, "token_bce": 0.1419445913809317, "token_smooth": 0.4855345775462963, "dilation": 0.18532076235170716, "span_contrastive": 0.252571863245081, "span_triplet": 0.14833333333333334, "span_ce": 0.07349824693467882, "val_score": 0.42801170781221104, "best_score": 0.42801170781221104, "new_best_model": true, "precision@3": 0.19845370828251518, "recall@3": 0.5341370011688671, "f1@3": 0.2892948451630314, "precision_soft@3": 0.2935730290270333, "recall_soft@3": 0.7905202735232886, "f1_soft@3": 0.42801170781221104}, "10": {"lr": [1.1986127417882198e-05, 0.00028953039902753766], "train_loss": 0.730533242225647, "total": 0.7305332212094907, "token_bce": 0.13482808430989585, "token_smooth": 0.485777904369213, "dilation": 0.17757729989510995, "span_contrastive": 0.23368607132523148, "span_triplet": 0.13824074074074075, "span_ce": 0.06673768785264757, "val_score": 0.4308789724238528, "best_score": 0.4308789724238528, "new_best_model": true, "precision@3": 0.1994629552521267, "recall@3": 0.5300510591964904, "f1@3": 0.2897516989284916, "precision_soft@3": 0.29659413347437763, "recall_soft@3": 0.7883337193833123, "f1_soft@3": 0.4308789724238528}, "11": {"lr": [1.0500000000000003e-05, 0.0002505], "train_loss": 0.6906977891921997, "total": 0.6906977900752315, "token_bce": 0.1281228185583044, "token_smooth": 0.48839934172453703, "dilation": 0.1714169876663773, "span_contrastive": 0.2165081787109375, "span_triplet": 0.12768518518518518, "span_ce": 0.0619825914171007, "val_score": 0.4344366933568109, "best_score": 0.4344366933568109, "new_best_model": true, "precision@3": 0.200514348971081, "recall@3": 0.5240043763527353, "f1@3": 0.28993934168780405, "precision_soft@3": 0.30038825962944765, "recall_soft@3": 0.7855217050957631, "f1_soft@3": 0.4344366933568109}, "12": {"lr": [9.013872582117811e-06, 0.00021146960097246246], "train_loss": 0.639044463634491, "total": 0.6390444607204862, "token_bce": 0.12305115876374421, "token_smooth": 0.4892825882523148, "dilation": 0.16562419750072338, "span_contrastive": 0.1895014444986979, "span_triplet": 0.11166666666666666, "span_ce": 0.05598465530960648, "val_score": 0.4377692076802983, "best_score": 0.4377692076802983, "new_best_model": true, "precision@3": 0.20251423260184695, "recall@3": 0.5203001866230301, "f1@3": 0.291424743683959, "precision_soft@3": 0.30414550561703696, "recall_soft@3": 0.7819904968510238, "f1_soft@3": 0.4377692076802983}, "13": {"lr": [7.564338553438001e-06, 0.00017340025990345064], "train_loss": 0.6190622448921204, "total": 0.6190622287326389, "token_bce": 0.11804774531611689, "token_smooth": 0.4910555465133102, "dilation": 0.16060821533203126, "span_contrastive": 0.18485634132667825, "span_triplet": 0.10898148148148148, "span_ce": 0.05175048262984664, "val_score": 0.4434620939849902, "best_score": 0.4434620939849902, "new_best_model": true, "precision@3": 0.20445519790756514, "recall@3": 0.514626734766467, "f1@3": 0.29249657953237834, "precision_soft@3": 0.30993478680471515, "recall_soft@3": 0.7805231366682371, "f1_soft@3": 0.4434620939849902}, "14": {"lr": [6.1870902524743065e-06, 0.00013722937031498307], "train_loss": 0.5810005068778992, "total": 0.5810004792390047, "token_bce": 0.11407884385850695, "token_smooth": 0.4919797092013889, "dilation": 0.15709197998046875, "span_contrastive": 0.16475484212239583, "span_triplet": 0.09731481481481481, "span_ce": 0.047098973592122395, "val_score": 0.4491814955765573, "best_score": 0.4491814955765573, "new_best_model": true, "precision@3": 0.20807857473496577, "recall@3": 0.5126370216266161, "f1@3": 0.295831800370707, "precision_soft@3": 0.3158892890082118, "recall_soft@3": 0.7786655029873666, "f1_soft@3": 0.4491814955765573}, "15": {"lr": [4.916040103221507e-06, 0.00010384757955302797], "train_loss": 0.5580182671546936, "total": 0.5580182562934027, "token_bce": 0.11126241048177084, "token_smooth": 0.4931563313802083, "dilation": 0.15409192120587384, "span_contrastive": 0.15438779477719908, "span_triplet": 0.09078703703703704, "span_ce": 0.04364092508951823, "val_score": 0.45184009683921444, "best_score": 0.45184009683921444, "new_best_model": true, "precision@3": 0.20868124824825746, "recall@3": 0.5022112656241178, "f1@3": 0.2946372891040595, "precision_soft@3": 0.3199986998899058, "recall_soft@3": 0.7703061514234444, "f1_soft@3": 0.45184009683921444}, "16": {"lr": [3.7824855787278e-06, 7.40768580939564e-05], "train_loss": 0.5451138615608215, "total": 0.5451138870804398, "token_bce": 0.10881063955801505, "token_smooth": 0.49385398582175927, "dilation": 0.1516392347547743, "span_contrastive": 0.14960634584780091, "span_triplet": 0.08828703703703704, "span_ce": 0.0415204111735026, "val_score": 0.45583425284999385, "best_score": 0.45583425284999385, "new_best_model": true, "precision@3": 0.21006875131347477, "recall@3": 0.4931301637263824, "f1@3": 0.2943917904907063, "precision_soft@3": 0.32522429321936674, "recall_soft@3": 0.76380187716377, "f1_soft@3": 0.45583425284999385}, "17": {"lr": [2.814338553438001e-06, 4.865025990345063e-05], "train_loss": 0.5261017680168152, "total": 0.5261017523871527, "token_bce": 0.10668060302734375, "token_smooth": 0.4929262514467593, "dilation": 0.1492363710756655, "span_contrastive": 0.13998194941767939, "span_triplet": 0.08236111111111111, "span_ce": 0.039466312549732346, "val_score": 0.45916970536273743, "best_score": 0.45916970536273743, "new_best_model": true, "precision@3": 0.2109984194999653, "recall@3": 0.4840047513004945, "f1@3": 0.29364798277801296, "precision_soft@3": 0.32991277092817434, "recall_soft@3": 0.7569337452977937, "f1_soft@3": 0.45916970536273743}, "18": {"lr": [2.0354380202105066e-06, 2.8193872215002235e-05], "train_loss": 0.5028696060180664, "total": 0.5028696017795139, "token_bce": 0.10478624131944445, "token_smooth": 0.4946022768373843, "dilation": 0.14765551531756366, "span_contrastive": 0.12705839934172453, "span_triplet": 0.07393518518518519, "span_ce": 0.036977719907407405, "val_score": 0.4643015639624314, "best_score": 0.4643015639624314, "new_best_model": true, "precision@3": 0.21411629852172517, "recall@3": 0.4786627762796602, "f1@3": 0.295614196868657, "precision_soft@3": 0.3362673576990195, "recall_soft@3": 0.7519351768702682, "f1_soft@3": 0.4643015639624314}}
|
42_add_dilation_loss_for_token_logits_43/r1s/42_add_dilation_loss_for_token_logits_43_s26092004_f0_r1_vs0.46430_ema.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c17f9f6db408e87673371d16bf5142edde96ebf8c7d6475844a5d81dd4f8d333
|
| 3 |
+
size 584846504
|
42_add_dilation_loss_for_token_logits_43/results/42_add_dilation_loss_for_token_logits_43_test.json
ADDED
|
@@ -0,0 +1,86 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"Best model": {
|
| 3 |
+
"1": {
|
| 4 |
+
"precision@1": 0.2762645914387115,
|
| 5 |
+
"recall@1": 0.2669172932321705,
|
| 6 |
+
"f1@1": 0.2715105112529269,
|
| 7 |
+
"precision_soft@1": 0.6101874778895996,
|
| 8 |
+
"recall_soft@1": 0.5895420369084431,
|
| 9 |
+
"f1_soft@1": 0.5996871147629975
|
| 10 |
+
},
|
| 11 |
+
"2": {
|
| 12 |
+
"precision@2": 0.23935854286232558,
|
| 13 |
+
"recall@2": 0.4131920710853958,
|
| 14 |
+
"f1@2": 0.3031214695924961,
|
| 15 |
+
"precision_soft@2": 0.41437339140682167,
|
| 16 |
+
"recall_soft@2": 0.7153110047822443,
|
| 17 |
+
"f1_soft@2": 0.5247586765619793
|
| 18 |
+
},
|
| 19 |
+
"3": {
|
| 20 |
+
"precision@3": 0.22253000923326788,
|
| 21 |
+
"recall@3": 0.49419002050412103,
|
| 22 |
+
"f1@3": 0.30687605683821934,
|
| 23 |
+
"precision_soft@3": 0.34256694367444973,
|
| 24 |
+
"recall_soft@3": 0.7607655502366345,
|
| 25 |
+
"f1_soft@3": 0.47241086159168805
|
| 26 |
+
},
|
| 27 |
+
"4": {
|
| 28 |
+
"precision@4": 0.21454792658026575,
|
| 29 |
+
"recall@4": 0.5393028024588541,
|
| 30 |
+
"f1@4": 0.30697402569096477,
|
| 31 |
+
"precision_soft@4": 0.3118966689322748,
|
| 32 |
+
"recall_soft@4": 0.7840054682133151,
|
| 33 |
+
"f1_soft@4": 0.44626008735784684
|
| 34 |
+
},
|
| 35 |
+
"5": {
|
| 36 |
+
"precision@5": 0.21289752650149812,
|
| 37 |
+
"recall@5": 0.5765550239214745,
|
| 38 |
+
"f1@5": 0.31096773799588057,
|
| 39 |
+
"precision_soft@5": 0.2965673902065919,
|
| 40 |
+
"recall_soft@5": 0.8031442241941109,
|
| 41 |
+
"f1_soft@5": 0.4331797195624755
|
| 42 |
+
}
|
| 43 |
+
},
|
| 44 |
+
"Last model": {
|
| 45 |
+
"1": {
|
| 46 |
+
"precision@1": 0.2762645914387115,
|
| 47 |
+
"recall@1": 0.2669172932321705,
|
| 48 |
+
"f1@1": 0.2715105112529269,
|
| 49 |
+
"precision_soft@1": 0.6101874778895996,
|
| 50 |
+
"recall_soft@1": 0.5895420369084431,
|
| 51 |
+
"f1_soft@1": 0.5996871147629975
|
| 52 |
+
},
|
| 53 |
+
"2": {
|
| 54 |
+
"precision@2": 0.23935854286232558,
|
| 55 |
+
"recall@2": 0.4131920710853958,
|
| 56 |
+
"f1@2": 0.3031214695924961,
|
| 57 |
+
"precision_soft@2": 0.41437339140682167,
|
| 58 |
+
"recall_soft@2": 0.7153110047822443,
|
| 59 |
+
"f1_soft@2": 0.5247586765619793
|
| 60 |
+
},
|
| 61 |
+
"3": {
|
| 62 |
+
"precision@3": 0.22253000923326788,
|
| 63 |
+
"recall@3": 0.49419002050412103,
|
| 64 |
+
"f1@3": 0.30687605683821934,
|
| 65 |
+
"precision_soft@3": 0.34256694367444973,
|
| 66 |
+
"recall_soft@3": 0.7607655502366345,
|
| 67 |
+
"f1_soft@3": 0.47241086159168805
|
| 68 |
+
},
|
| 69 |
+
"4": {
|
| 70 |
+
"precision@4": 0.21454792658026575,
|
| 71 |
+
"recall@4": 0.5393028024588541,
|
| 72 |
+
"f1@4": 0.30697402569096477,
|
| 73 |
+
"precision_soft@4": 0.3118966689322748,
|
| 74 |
+
"recall_soft@4": 0.7840054682133151,
|
| 75 |
+
"f1_soft@4": 0.44626008735784684
|
| 76 |
+
},
|
| 77 |
+
"5": {
|
| 78 |
+
"precision@5": 0.21289752650149812,
|
| 79 |
+
"recall@5": 0.5765550239214745,
|
| 80 |
+
"f1@5": 0.31096773799588057,
|
| 81 |
+
"precision_soft@5": 0.2965673902065919,
|
| 82 |
+
"recall_soft@5": 0.8031442241941109,
|
| 83 |
+
"f1_soft@5": 0.4331797195624755
|
| 84 |
+
}
|
| 85 |
+
}
|
| 86 |
+
}
|