Update training_history.json - Run 20251104_144102
Browse files
weights/David-decoupled-cantor_scale/20251104_144102/training_history.json
CHANGED
|
@@ -2,68 +2,81 @@
|
|
| 2 |
"epochs": [
|
| 3 |
1,
|
| 4 |
2,
|
| 5 |
-
3
|
|
|
|
| 6 |
],
|
| 7 |
"train_loss": [
|
| 8 |
1.8473644912409581,
|
| 9 |
1.2349187319534949,
|
| 10 |
-
1.0967776605571407
|
|
|
|
| 11 |
],
|
| 12 |
"train_acc": [
|
| 13 |
83.50909756495444,
|
| 14 |
87.53558279287556,
|
| 15 |
-
88.92135061237137
|
|
|
|
| 16 |
],
|
| 17 |
"val_acc": [
|
| 18 |
84.296,
|
| 19 |
84.784,
|
| 20 |
-
85.094
|
|
|
|
| 21 |
],
|
| 22 |
"scale_accs": {
|
| 23 |
"384": [
|
| 24 |
82.254,
|
| 25 |
83.082,
|
| 26 |
-
83.518
|
|
|
|
| 27 |
],
|
| 28 |
"512": [
|
| 29 |
82.682,
|
| 30 |
83.472,
|
| 31 |
-
84.012
|
|
|
|
| 32 |
],
|
| 33 |
"768": [
|
| 34 |
83.39,
|
| 35 |
84.056,
|
| 36 |
-
84.434
|
|
|
|
| 37 |
],
|
| 38 |
"1024": [
|
| 39 |
83.314,
|
| 40 |
83.934,
|
| 41 |
-
84.376
|
|
|
|
| 42 |
],
|
| 43 |
"1280": [
|
| 44 |
83.256,
|
| 45 |
83.656,
|
| 46 |
-
84.022
|
|
|
|
| 47 |
],
|
| 48 |
"1536": [
|
| 49 |
83.196,
|
| 50 |
83.854,
|
| 51 |
-
84.16
|
|
|
|
| 52 |
],
|
| 53 |
"1792": [
|
| 54 |
83.188,
|
| 55 |
83.842,
|
| 56 |
-
84.126
|
|
|
|
| 57 |
],
|
| 58 |
"2048": [
|
| 59 |
83.254,
|
| 60 |
84.048,
|
| 61 |
-
84.176
|
|
|
|
| 62 |
]
|
| 63 |
},
|
| 64 |
"lr": [
|
| 65 |
0.0009755527298894294,
|
| 66 |
0.0009046039886902864,
|
| 67 |
-
0.0007940987335200904
|
|
|
|
| 68 |
]
|
| 69 |
}
|
|
|
|
| 2 |
"epochs": [
|
| 3 |
1,
|
| 4 |
2,
|
| 5 |
+
3,
|
| 6 |
+
4
|
| 7 |
],
|
| 8 |
"train_loss": [
|
| 9 |
1.8473644912409581,
|
| 10 |
1.2349187319534949,
|
| 11 |
+
1.0967776605571407,
|
| 12 |
+
0.9883316958422095
|
| 13 |
],
|
| 14 |
"train_acc": [
|
| 15 |
83.50909756495444,
|
| 16 |
87.53558279287556,
|
| 17 |
+
88.92135061237137,
|
| 18 |
+
90.1239260767722
|
| 19 |
],
|
| 20 |
"val_acc": [
|
| 21 |
84.296,
|
| 22 |
84.784,
|
| 23 |
+
85.094,
|
| 24 |
+
85.114
|
| 25 |
],
|
| 26 |
"scale_accs": {
|
| 27 |
"384": [
|
| 28 |
82.254,
|
| 29 |
83.082,
|
| 30 |
+
83.518,
|
| 31 |
+
83.574
|
| 32 |
],
|
| 33 |
"512": [
|
| 34 |
82.682,
|
| 35 |
83.472,
|
| 36 |
+
84.012,
|
| 37 |
+
84.268
|
| 38 |
],
|
| 39 |
"768": [
|
| 40 |
83.39,
|
| 41 |
84.056,
|
| 42 |
+
84.434,
|
| 43 |
+
84.538
|
| 44 |
],
|
| 45 |
"1024": [
|
| 46 |
83.314,
|
| 47 |
83.934,
|
| 48 |
+
84.376,
|
| 49 |
+
84.428
|
| 50 |
],
|
| 51 |
"1280": [
|
| 52 |
83.256,
|
| 53 |
83.656,
|
| 54 |
+
84.022,
|
| 55 |
+
84.308
|
| 56 |
],
|
| 57 |
"1536": [
|
| 58 |
83.196,
|
| 59 |
83.854,
|
| 60 |
+
84.16,
|
| 61 |
+
84.14
|
| 62 |
],
|
| 63 |
"1792": [
|
| 64 |
83.188,
|
| 65 |
83.842,
|
| 66 |
+
84.126,
|
| 67 |
+
83.91
|
| 68 |
],
|
| 69 |
"2048": [
|
| 70 |
83.254,
|
| 71 |
84.048,
|
| 72 |
+
84.176,
|
| 73 |
+
84.008
|
| 74 |
]
|
| 75 |
},
|
| 76 |
"lr": [
|
| 77 |
0.0009755527298894294,
|
| 78 |
0.0009046039886902864,
|
| 79 |
+
0.0007940987335200904,
|
| 80 |
+
0.0006548539886902864
|
| 81 |
]
|
| 82 |
}
|