SS3M commited on
Commit
593eaec
·
verified ·
1 Parent(s): 8f5a488

Upload 42_add_dilation_loss_for_token_logits_43's state dict

Browse files
.gitattributes CHANGED
@@ -72,3 +72,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
72
  35_40_negs_40/logs/35_40_negs_40_log_plot.jpg filter=lfs diff=lfs merge=lfs -text
73
  41_remove_retrieval_from_tokens_42/logs/41_remove_retrieval_from_tokens_42_log_plot.jpg filter=lfs diff=lfs merge=lfs -text
74
  37_30_41/logs/37_30_41_log_plot.jpg filter=lfs diff=lfs merge=lfs -text
 
 
72
  35_40_negs_40/logs/35_40_negs_40_log_plot.jpg filter=lfs diff=lfs merge=lfs -text
73
  41_remove_retrieval_from_tokens_42/logs/41_remove_retrieval_from_tokens_42_log_plot.jpg filter=lfs diff=lfs merge=lfs -text
74
  37_30_41/logs/37_30_41_log_plot.jpg filter=lfs diff=lfs merge=lfs -text
75
+ 42_add_dilation_loss_for_token_logits_43/logs/42_add_dilation_loss_for_token_logits_43_log_plot.jpg filter=lfs diff=lfs merge=lfs -text
42_add_dilation_loss_for_token_logits_43/lasts/42_add_dilation_loss_for_token_logits_43_s26092004_f0_last_ema.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15d5797a4231e9d7106949a9e2c7afd063246c401927bf040115a40d4628d87f
3
+ size 584836960
42_add_dilation_loss_for_token_logits_43/logs/42_add_dilation_loss_for_token_logits_43_log_plot.jpg ADDED

Git LFS Details

  • SHA256: 883d431df98b041e2a62675cb0a97e8f8a234b4a2c475f24e02cdd0b38d1423b
  • Pointer size: 131 Bytes
  • Size of remote file: 476 kB
42_add_dilation_loss_for_token_logits_43/logs/42_add_dilation_loss_for_token_logits_43_s26092004_f0_logging.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"1": {"lr": [2e-05, 0.0005], "train_loss": 1.7462430000305176, "total": 1.7462429470486112, "token_bce": 0.2636160843460648, "token_smooth": 0.5109800437644676, "dilation": 0.32428349247685184, "span_contrastive": 0.7043267144097223, "span_triplet": 0.42962962962962964, "span_ce": 0.18889912923177082}, "2": {"lr": [1.988303923565381e-05, 0.0004969282409784868], "train_loss": 1.3336777687072754, "total": 1.3336777524594907, "token_bce": 0.20739935980902777, "token_smooth": 0.49858036747685186, "dilation": 0.2600263129340278, "span_contrastive": 0.5221408872251158, "span_triplet": 0.31703703703703706, "span_ce": 0.13495302553530092}, "3": {"lr": [1.9535036904803962e-05, 0.0004877886008156408], "train_loss": 1.2032934427261353, "total": 1.20329345703125, "token_bce": 0.19491963704427084, "token_smooth": 0.48699634693287036, "dilation": 0.2444973415798611, "span_contrastive": 0.45727909794560184, "span_triplet": 0.27574074074074073, "span_ce": 0.11956885443793402}, "4": {"lr": [1.8964561979789496e-05, 0.00047280612778499774], "train_loss": 1.0944128036499023, "total": 1.094412796585648, "token_bce": 0.18452086272063078, "token_smooth": 0.47530024775752316, "dilation": 0.23218505859375, "span_contrastive": 0.4013004105179398, "span_triplet": 0.2424074074074074, "span_ce": 0.10804502133969908}, "5": {"lr": [1.8185661446562005e-05, 0.00045234974009654937], "train_loss": 1.0207452774047852, "total": 1.0207452618634258, "token_bce": 0.17528016266999422, "token_smooth": 0.47418773509837964, "dilation": 0.22174784342447917, "span_contrastive": 0.3678669117115162, "span_triplet": 0.22018518518518518, "span_ce": 0.09872957582826968}, "6": {"lr": [1.7217514421272206e-05, 0.00042692314190604356], "train_loss": 0.9484228491783142, "total": 0.9484228515625, "token_bce": 0.166716229474103, "token_smooth": 0.4774904152199074, "dilation": 0.2118576614945023, "span_contrastive": 0.33283130787037035, "span_triplet": 0.19518518518518518, "span_ce": 0.09134540134006076}, "7": {"lr": [1.60839598967785e-05, 0.00039715242044697206], "train_loss": 0.8921521306037903, "total": 0.8921521448206019, "token_bce": 0.15747964364510994, "token_smooth": 0.4827188675491898, "dilation": 0.20180858470775462, "span_contrastive": 0.3075924117476852, "span_triplet": 0.1827777777777778, "span_ce": 0.08592472782841436}, "8": {"lr": [1.4812909747525698e-05, 0.00036377062968501693], "train_loss": 0.8299175500869751, "total": 0.8299175347222222, "token_bce": 0.1489540269639757, "token_smooth": 0.4829901801215278, "dilation": 0.19281021683304397, "span_contrastive": 0.27897951479311345, "span_triplet": 0.16268518518518518, "span_ce": 0.0792928625036169, "val_score": 0.42744371676604714, "best_score": 0.42744371676604714, "new_best_model": true, "precision@3": 0.1965177048101333, "recall@3": 0.530418325304959, "f1@3": 0.28670349083856006, "precision_soft@3": 0.2929707713555161, "recall_soft@3": 0.7908875396317571, "f1_soft@3": 0.42744371676604714}, "9": {"lr": [1.3435661446562005e-05, 0.0003275997400965494], "train_loss": 0.776001513004303, "total": 0.7760015190972223, "token_bce": 0.1419445913809317, "token_smooth": 0.4855345775462963, "dilation": 0.18532076235170716, "span_contrastive": 0.252571863245081, "span_triplet": 0.14833333333333334, "span_ce": 0.07349824693467882, "val_score": 0.42801170781221104, "best_score": 0.42801170781221104, "new_best_model": true, "precision@3": 0.19845370828251518, "recall@3": 0.5341370011688671, "f1@3": 0.2892948451630314, "precision_soft@3": 0.2935730290270333, "recall_soft@3": 0.7905202735232886, "f1_soft@3": 0.42801170781221104}, "10": {"lr": [1.1986127417882198e-05, 0.00028953039902753766], "train_loss": 0.730533242225647, "total": 0.7305332212094907, "token_bce": 0.13482808430989585, "token_smooth": 0.485777904369213, "dilation": 0.17757729989510995, "span_contrastive": 0.23368607132523148, "span_triplet": 0.13824074074074075, "span_ce": 0.06673768785264757, "val_score": 0.4308789724238528, "best_score": 0.4308789724238528, "new_best_model": true, "precision@3": 0.1994629552521267, "recall@3": 0.5300510591964904, "f1@3": 0.2897516989284916, "precision_soft@3": 0.29659413347437763, "recall_soft@3": 0.7883337193833123, "f1_soft@3": 0.4308789724238528}, "11": {"lr": [1.0500000000000003e-05, 0.0002505], "train_loss": 0.6906977891921997, "total": 0.6906977900752315, "token_bce": 0.1281228185583044, "token_smooth": 0.48839934172453703, "dilation": 0.1714169876663773, "span_contrastive": 0.2165081787109375, "span_triplet": 0.12768518518518518, "span_ce": 0.0619825914171007, "val_score": 0.4344366933568109, "best_score": 0.4344366933568109, "new_best_model": true, "precision@3": 0.200514348971081, "recall@3": 0.5240043763527353, "f1@3": 0.28993934168780405, "precision_soft@3": 0.30038825962944765, "recall_soft@3": 0.7855217050957631, "f1_soft@3": 0.4344366933568109}, "12": {"lr": [9.013872582117811e-06, 0.00021146960097246246], "train_loss": 0.639044463634491, "total": 0.6390444607204862, "token_bce": 0.12305115876374421, "token_smooth": 0.4892825882523148, "dilation": 0.16562419750072338, "span_contrastive": 0.1895014444986979, "span_triplet": 0.11166666666666666, "span_ce": 0.05598465530960648, "val_score": 0.4377692076802983, "best_score": 0.4377692076802983, "new_best_model": true, "precision@3": 0.20251423260184695, "recall@3": 0.5203001866230301, "f1@3": 0.291424743683959, "precision_soft@3": 0.30414550561703696, "recall_soft@3": 0.7819904968510238, "f1_soft@3": 0.4377692076802983}, "13": {"lr": [7.564338553438001e-06, 0.00017340025990345064], "train_loss": 0.6190622448921204, "total": 0.6190622287326389, "token_bce": 0.11804774531611689, "token_smooth": 0.4910555465133102, "dilation": 0.16060821533203126, "span_contrastive": 0.18485634132667825, "span_triplet": 0.10898148148148148, "span_ce": 0.05175048262984664, "val_score": 0.4434620939849902, "best_score": 0.4434620939849902, "new_best_model": true, "precision@3": 0.20445519790756514, "recall@3": 0.514626734766467, "f1@3": 0.29249657953237834, "precision_soft@3": 0.30993478680471515, "recall_soft@3": 0.7805231366682371, "f1_soft@3": 0.4434620939849902}, "14": {"lr": [6.1870902524743065e-06, 0.00013722937031498307], "train_loss": 0.5810005068778992, "total": 0.5810004792390047, "token_bce": 0.11407884385850695, "token_smooth": 0.4919797092013889, "dilation": 0.15709197998046875, "span_contrastive": 0.16475484212239583, "span_triplet": 0.09731481481481481, "span_ce": 0.047098973592122395, "val_score": 0.4491814955765573, "best_score": 0.4491814955765573, "new_best_model": true, "precision@3": 0.20807857473496577, "recall@3": 0.5126370216266161, "f1@3": 0.295831800370707, "precision_soft@3": 0.3158892890082118, "recall_soft@3": 0.7786655029873666, "f1_soft@3": 0.4491814955765573}, "15": {"lr": [4.916040103221507e-06, 0.00010384757955302797], "train_loss": 0.5580182671546936, "total": 0.5580182562934027, "token_bce": 0.11126241048177084, "token_smooth": 0.4931563313802083, "dilation": 0.15409192120587384, "span_contrastive": 0.15438779477719908, "span_triplet": 0.09078703703703704, "span_ce": 0.04364092508951823, "val_score": 0.45184009683921444, "best_score": 0.45184009683921444, "new_best_model": true, "precision@3": 0.20868124824825746, "recall@3": 0.5022112656241178, "f1@3": 0.2946372891040595, "precision_soft@3": 0.3199986998899058, "recall_soft@3": 0.7703061514234444, "f1_soft@3": 0.45184009683921444}, "16": {"lr": [3.7824855787278e-06, 7.40768580939564e-05], "train_loss": 0.5451138615608215, "total": 0.5451138870804398, "token_bce": 0.10881063955801505, "token_smooth": 0.49385398582175927, "dilation": 0.1516392347547743, "span_contrastive": 0.14960634584780091, "span_triplet": 0.08828703703703704, "span_ce": 0.0415204111735026, "val_score": 0.45583425284999385, "best_score": 0.45583425284999385, "new_best_model": true, "precision@3": 0.21006875131347477, "recall@3": 0.4931301637263824, "f1@3": 0.2943917904907063, "precision_soft@3": 0.32522429321936674, "recall_soft@3": 0.76380187716377, "f1_soft@3": 0.45583425284999385}, "17": {"lr": [2.814338553438001e-06, 4.865025990345063e-05], "train_loss": 0.5261017680168152, "total": 0.5261017523871527, "token_bce": 0.10668060302734375, "token_smooth": 0.4929262514467593, "dilation": 0.1492363710756655, "span_contrastive": 0.13998194941767939, "span_triplet": 0.08236111111111111, "span_ce": 0.039466312549732346, "val_score": 0.45916970536273743, "best_score": 0.45916970536273743, "new_best_model": true, "precision@3": 0.2109984194999653, "recall@3": 0.4840047513004945, "f1@3": 0.29364798277801296, "precision_soft@3": 0.32991277092817434, "recall_soft@3": 0.7569337452977937, "f1_soft@3": 0.45916970536273743}, "18": {"lr": [2.0354380202105066e-06, 2.8193872215002235e-05], "train_loss": 0.5028696060180664, "total": 0.5028696017795139, "token_bce": 0.10478624131944445, "token_smooth": 0.4946022768373843, "dilation": 0.14765551531756366, "span_contrastive": 0.12705839934172453, "span_triplet": 0.07393518518518519, "span_ce": 0.036977719907407405, "val_score": 0.4643015639624314, "best_score": 0.4643015639624314, "new_best_model": true, "precision@3": 0.21411629852172517, "recall@3": 0.4786627762796602, "f1@3": 0.295614196868657, "precision_soft@3": 0.3362673576990195, "recall_soft@3": 0.7519351768702682, "f1_soft@3": 0.4643015639624314}}
42_add_dilation_loss_for_token_logits_43/r1s/42_add_dilation_loss_for_token_logits_43_s26092004_f0_r1_vs0.46430_ema.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c17f9f6db408e87673371d16bf5142edde96ebf8c7d6475844a5d81dd4f8d333
3
+ size 584846504
42_add_dilation_loss_for_token_logits_43/results/42_add_dilation_loss_for_token_logits_43_test.json ADDED
@@ -0,0 +1,86 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "Best model": {
3
+ "1": {
4
+ "precision@1": 0.2762645914387115,
5
+ "recall@1": 0.2669172932321705,
6
+ "f1@1": 0.2715105112529269,
7
+ "precision_soft@1": 0.6101874778895996,
8
+ "recall_soft@1": 0.5895420369084431,
9
+ "f1_soft@1": 0.5996871147629975
10
+ },
11
+ "2": {
12
+ "precision@2": 0.23935854286232558,
13
+ "recall@2": 0.4131920710853958,
14
+ "f1@2": 0.3031214695924961,
15
+ "precision_soft@2": 0.41437339140682167,
16
+ "recall_soft@2": 0.7153110047822443,
17
+ "f1_soft@2": 0.5247586765619793
18
+ },
19
+ "3": {
20
+ "precision@3": 0.22253000923326788,
21
+ "recall@3": 0.49419002050412103,
22
+ "f1@3": 0.30687605683821934,
23
+ "precision_soft@3": 0.34256694367444973,
24
+ "recall_soft@3": 0.7607655502366345,
25
+ "f1_soft@3": 0.47241086159168805
26
+ },
27
+ "4": {
28
+ "precision@4": 0.21454792658026575,
29
+ "recall@4": 0.5393028024588541,
30
+ "f1@4": 0.30697402569096477,
31
+ "precision_soft@4": 0.3118966689322748,
32
+ "recall_soft@4": 0.7840054682133151,
33
+ "f1_soft@4": 0.44626008735784684
34
+ },
35
+ "5": {
36
+ "precision@5": 0.21289752650149812,
37
+ "recall@5": 0.5765550239214745,
38
+ "f1@5": 0.31096773799588057,
39
+ "precision_soft@5": 0.2965673902065919,
40
+ "recall_soft@5": 0.8031442241941109,
41
+ "f1_soft@5": 0.4331797195624755
42
+ }
43
+ },
44
+ "Last model": {
45
+ "1": {
46
+ "precision@1": 0.2762645914387115,
47
+ "recall@1": 0.2669172932321705,
48
+ "f1@1": 0.2715105112529269,
49
+ "precision_soft@1": 0.6101874778895996,
50
+ "recall_soft@1": 0.5895420369084431,
51
+ "f1_soft@1": 0.5996871147629975
52
+ },
53
+ "2": {
54
+ "precision@2": 0.23935854286232558,
55
+ "recall@2": 0.4131920710853958,
56
+ "f1@2": 0.3031214695924961,
57
+ "precision_soft@2": 0.41437339140682167,
58
+ "recall_soft@2": 0.7153110047822443,
59
+ "f1_soft@2": 0.5247586765619793
60
+ },
61
+ "3": {
62
+ "precision@3": 0.22253000923326788,
63
+ "recall@3": 0.49419002050412103,
64
+ "f1@3": 0.30687605683821934,
65
+ "precision_soft@3": 0.34256694367444973,
66
+ "recall_soft@3": 0.7607655502366345,
67
+ "f1_soft@3": 0.47241086159168805
68
+ },
69
+ "4": {
70
+ "precision@4": 0.21454792658026575,
71
+ "recall@4": 0.5393028024588541,
72
+ "f1@4": 0.30697402569096477,
73
+ "precision_soft@4": 0.3118966689322748,
74
+ "recall_soft@4": 0.7840054682133151,
75
+ "f1_soft@4": 0.44626008735784684
76
+ },
77
+ "5": {
78
+ "precision@5": 0.21289752650149812,
79
+ "recall@5": 0.5765550239214745,
80
+ "f1@5": 0.31096773799588057,
81
+ "precision_soft@5": 0.2965673902065919,
82
+ "recall_soft@5": 0.8031442241941109,
83
+ "f1_soft@5": 0.4331797195624755
84
+ }
85
+ }
86
+ }