Epoch 200 - 74.63% acc
Browse files- weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/README.md +1 -1
- weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/best.safetensors +1 -1
- weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/tensorboard/events.out.tfevents.1764539877.a14155bc494d.1798.0 +2 -2
- weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/training_history.json +44 -4
weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/README.md
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
# Run: run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740
|
| 2 |
|
| 3 |
## Results
|
| 4 |
-
- **Best Accuracy**: 74.
|
| 5 |
- **Dataset**: cifar100
|
| 6 |
- **Epochs**: 200
|
| 7 |
- **Model Version**: V2
|
|
|
|
| 1 |
# Run: run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740
|
| 2 |
|
| 3 |
## Results
|
| 4 |
+
- **Best Accuracy**: 74.63%
|
| 5 |
- **Dataset**: cifar100
|
| 6 |
- **Epochs**: 200
|
| 7 |
- **Model Version**: V2
|
weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/best.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 183271432
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4f80ec79712bbf2e5e822f6284590dd7812b157dcae8301a878f4dd2c0ab6ec6
|
| 3 |
size 183271432
|
weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/tensorboard/events.out.tfevents.1764539877.a14155bc494d.1798.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ce30eb306dcb5d3427da93a357a2f389214ef5cbaa2faba45ddcb585926cbdd2
|
| 3 |
+
size 819254
|
weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/training_history.json
CHANGED
|
@@ -188,7 +188,17 @@
|
|
| 188 |
2.982011616306427,
|
| 189 |
2.8773136229087144,
|
| 190 |
2.881724190177062,
|
| 191 |
-
2.9527760760906414
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 192 |
],
|
| 193 |
"ce": [
|
| 194 |
4.357172321661925,
|
|
@@ -379,7 +389,17 @@
|
|
| 379 |
1.4297002922265958,
|
| 380 |
1.4251254486349914,
|
| 381 |
1.5000684622770701,
|
| 382 |
-
1.486207452034339
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 383 |
],
|
| 384 |
"contrast": [
|
| 385 |
4.529944934600439,
|
|
@@ -570,7 +590,17 @@
|
|
| 570 |
1.5523113168967075,
|
| 571 |
1.4521881712170748,
|
| 572 |
1.3816557424190716,
|
| 573 |
-
1.4665686394923771
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 574 |
],
|
| 575 |
"lr": [
|
| 576 |
2.9999999999999997e-05,
|
|
@@ -761,6 +791,16 @@
|
|
| 761 |
1.5134556848374758e-06,
|
| 762 |
1.3286790323914947e-06,
|
| 763 |
1.1849114449367806e-06,
|
| 764 |
-
1.0821922270962664e-06
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 765 |
]
|
| 766 |
}
|
|
|
|
| 188 |
2.982011616306427,
|
| 189 |
2.8773136229087144,
|
| 190 |
2.881724190177062,
|
| 191 |
+
2.9527760760906414,
|
| 192 |
+
2.8433857324031684,
|
| 193 |
+
3.0805756553625447,
|
| 194 |
+
3.173988501460124,
|
| 195 |
+
3.150149035300964,
|
| 196 |
+
3.103418334860068,
|
| 197 |
+
2.8207061011057633,
|
| 198 |
+
3.148410226519291,
|
| 199 |
+
3.161121110809155,
|
| 200 |
+
2.8404618583428554,
|
| 201 |
+
2.9575896367048604
|
| 202 |
],
|
| 203 |
"ce": [
|
| 204 |
4.357172321661925,
|
|
|
|
| 389 |
1.4297002922265958,
|
| 390 |
1.4251254486349914,
|
| 391 |
1.5000684622770701,
|
| 392 |
+
1.486207452034339,
|
| 393 |
+
1.456172984188948,
|
| 394 |
+
1.5544836999514164,
|
| 395 |
+
1.5727642617928677,
|
| 396 |
+
1.527232175721572,
|
| 397 |
+
1.507080121835073,
|
| 398 |
+
1.3873552537117249,
|
| 399 |
+
1.4863953222066928,
|
| 400 |
+
1.5048485752863763,
|
| 401 |
+
1.44448418063231,
|
| 402 |
+
1.5417078345249862
|
| 403 |
],
|
| 404 |
"contrast": [
|
| 405 |
4.529944934600439,
|
|
|
|
| 590 |
1.5523113168967075,
|
| 591 |
1.4521881712170748,
|
| 592 |
1.3816557424190716,
|
| 593 |
+
1.4665686394923771,
|
| 594 |
+
1.387212754977055,
|
| 595 |
+
1.5260919726811923,
|
| 596 |
+
1.6012242632034497,
|
| 597 |
+
1.6229168613369649,
|
| 598 |
+
1.5963382177628003,
|
| 599 |
+
1.4333508509091841,
|
| 600 |
+
1.6620149140174572,
|
| 601 |
+
1.6562725476347484,
|
| 602 |
+
1.3959776806525694,
|
| 603 |
+
1.4158818163168736
|
| 604 |
],
|
| 605 |
"lr": [
|
| 606 |
2.9999999999999997e-05,
|
|
|
|
| 791 |
1.5134556848374758e-06,
|
| 792 |
1.3286790323914947e-06,
|
| 793 |
1.1849114449367806e-06,
|
| 794 |
+
1.0821922270962664e-06,
|
| 795 |
+
1.0205494612784436e-06,
|
| 796 |
+
1e-06,
|
| 797 |
+
1.0204359036258838e-06,
|
| 798 |
+
1.0817380275315555e-06,
|
| 799 |
+
1.1838896123284415e-06,
|
| 800 |
+
1.3268627307932066e-06,
|
| 801 |
+
1.5106182955028572e-06,
|
| 802 |
+
1.7351060695207923e-06,
|
| 803 |
+
2.00026468013108e-06,
|
| 804 |
+
2.306021635617207e-06
|
| 805 |
]
|
| 806 |
}
|