Upload sigma_lambda_pure_v1/history.json with huggingface_hub
Browse files
sigma_lambda_pure_v1/history.json
CHANGED
|
@@ -1,73 +1,91 @@
|
|
| 1 |
{
|
| 2 |
"epoch": [
|
| 3 |
1,
|
| 4 |
-
2
|
|
|
|
| 5 |
],
|
| 6 |
"L_ce": [
|
| 7 |
14.331461430318427,
|
| 8 |
-
9.380760340257124
|
|
|
|
| 9 |
],
|
| 10 |
"L_geo": [
|
| 11 |
0.9581514698041208,
|
| 12 |
-
0.6168224997231454
|
|
|
|
| 13 |
],
|
| 14 |
"L_mono": [
|
| 15 |
0.000488300864839623,
|
| 16 |
-
0.0005662547603071399
|
|
|
|
| 17 |
],
|
| 18 |
"ret_loss": [
|
|
|
|
| 19 |
0.0,
|
| 20 |
0.0
|
| 21 |
],
|
| 22 |
"ppl": [
|
| 23 |
3565.3611632608254,
|
| 24 |
-
337.54682195459276
|
|
|
|
| 25 |
],
|
| 26 |
"tf_acc": [
|
| 27 |
0.4297560097089016,
|
| 28 |
-
0.4887341592392626
|
|
|
|
| 29 |
],
|
| 30 |
"fr_acc": [
|
| 31 |
0.0862397060965078,
|
| 32 |
-
0.1707139777687095
|
|
|
|
| 33 |
],
|
| 34 |
"def_rate": [
|
|
|
|
| 35 |
1.0,
|
| 36 |
1.0
|
| 37 |
],
|
| 38 |
"mrr": [
|
| 39 |
0.00940620992332697,
|
| 40 |
-
0.010582948103547096
|
|
|
|
| 41 |
],
|
| 42 |
"r1": [
|
| 43 |
0.0010416667209938169,
|
| 44 |
-
0.0020833334419876337
|
|
|
|
| 45 |
],
|
| 46 |
"ret_ok_pct": [
|
|
|
|
| 47 |
0.0,
|
| 48 |
0.0
|
| 49 |
],
|
| 50 |
"gn_field": [
|
| 51 |
1.637221244392973,
|
| 52 |
-
0.1569300211017782
|
|
|
|
| 53 |
],
|
| 54 |
"gn_gfpd": [
|
| 55 |
296675.0374047661,
|
| 56 |
-
0.12336013482375578
|
|
|
|
| 57 |
],
|
| 58 |
"eta_mu": [
|
| 59 |
0.018591582775115967,
|
| 60 |
-
0.020370446145534515
|
|
|
|
| 61 |
],
|
| 62 |
"eta_h": [
|
| 63 |
0.21234284341335297,
|
| 64 |
-
0.23142163455486298
|
|
|
|
| 65 |
],
|
| 66 |
"beta_mean": [
|
| 67 |
0.11307718604803085,
|
| 68 |
-
0.18666285276412964
|
|
|
|
| 69 |
],
|
| 70 |
"w_ret": [
|
|
|
|
| 71 |
0.0,
|
| 72 |
0.0
|
| 73 |
]
|
|
|
|
| 1 |
{
|
| 2 |
"epoch": [
|
| 3 |
1,
|
| 4 |
+
2,
|
| 5 |
+
3
|
| 6 |
],
|
| 7 |
"L_ce": [
|
| 8 |
14.331461430318427,
|
| 9 |
+
9.380760340257124,
|
| 10 |
+
9.188111376617893
|
| 11 |
],
|
| 12 |
"L_geo": [
|
| 13 |
0.9581514698041208,
|
| 14 |
+
0.6168224997231454,
|
| 15 |
+
0.6412599489363757
|
| 16 |
],
|
| 17 |
"L_mono": [
|
| 18 |
0.000488300864839623,
|
| 19 |
+
0.0005662547603071399,
|
| 20 |
+
0.0005689422242567437
|
| 21 |
],
|
| 22 |
"ret_loss": [
|
| 23 |
+
0.0,
|
| 24 |
0.0,
|
| 25 |
0.0
|
| 26 |
],
|
| 27 |
"ppl": [
|
| 28 |
3565.3611632608254,
|
| 29 |
+
337.54682195459276,
|
| 30 |
+
91.64535149630018
|
| 31 |
],
|
| 32 |
"tf_acc": [
|
| 33 |
0.4297560097089016,
|
| 34 |
+
0.4887341592392626,
|
| 35 |
+
0.5010944550332145
|
| 36 |
],
|
| 37 |
"fr_acc": [
|
| 38 |
0.0862397060965078,
|
| 39 |
+
0.1707139777687095,
|
| 40 |
+
0.11576797712301375
|
| 41 |
],
|
| 42 |
"def_rate": [
|
| 43 |
+
1.0,
|
| 44 |
1.0,
|
| 45 |
1.0
|
| 46 |
],
|
| 47 |
"mrr": [
|
| 48 |
0.00940620992332697,
|
| 49 |
+
0.010582948103547096,
|
| 50 |
+
0.010786919854581356
|
| 51 |
],
|
| 52 |
"r1": [
|
| 53 |
0.0010416667209938169,
|
| 54 |
+
0.0020833334419876337,
|
| 55 |
+
0.0010416667209938169
|
| 56 |
],
|
| 57 |
"ret_ok_pct": [
|
| 58 |
+
0.0,
|
| 59 |
0.0,
|
| 60 |
0.0
|
| 61 |
],
|
| 62 |
"gn_field": [
|
| 63 |
1.637221244392973,
|
| 64 |
+
0.1569300211017782,
|
| 65 |
+
0.18608613897453655
|
| 66 |
],
|
| 67 |
"gn_gfpd": [
|
| 68 |
296675.0374047661,
|
| 69 |
+
0.12336013482375578,
|
| 70 |
+
0.13450139917207488
|
| 71 |
],
|
| 72 |
"eta_mu": [
|
| 73 |
0.018591582775115967,
|
| 74 |
+
0.020370446145534515,
|
| 75 |
+
0.023813309147953987
|
| 76 |
],
|
| 77 |
"eta_h": [
|
| 78 |
0.21234284341335297,
|
| 79 |
+
0.23142163455486298,
|
| 80 |
+
0.26711082458496094
|
| 81 |
],
|
| 82 |
"beta_mean": [
|
| 83 |
0.11307718604803085,
|
| 84 |
+
0.18666285276412964,
|
| 85 |
+
0.31345537304878235
|
| 86 |
],
|
| 87 |
"w_ret": [
|
| 88 |
+
0.0,
|
| 89 |
0.0,
|
| 90 |
0.0
|
| 91 |
]
|