Epoch 170 - 74.54% acc
Browse files- weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/README.md +1 -1
- weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/best.safetensors +1 -1
- weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/tensorboard/events.out.tfevents.1764539877.a14155bc494d.1798.0 +2 -2
- weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/training_history.json +44 -4
weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/README.md
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
# Run: run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740
|
| 2 |
|
| 3 |
## Results
|
| 4 |
-
- **Best Accuracy**: 74.
|
| 5 |
- **Dataset**: cifar100
|
| 6 |
- **Epochs**: 200
|
| 7 |
- **Model Version**: V2
|
|
|
|
| 1 |
# Run: run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740
|
| 2 |
|
| 3 |
## Results
|
| 4 |
+
- **Best Accuracy**: 74.54%
|
| 5 |
- **Dataset**: cifar100
|
| 6 |
- **Epochs**: 200
|
| 7 |
- **Model Version**: V2
|
weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/best.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 183271432
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:65e277bf19c1f66a51e23fba2f4c47fc7514b908ec244b07b393e36be7c8ace5
|
| 3 |
size 183271432
|
weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/tensorboard/events.out.tfevents.1764539877.a14155bc494d.1798.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:336a562e119b4c0f349deaba5684fdae33fe01ccaffc9da11a02ffaaa8b76a5c
|
| 3 |
+
size 696174
|
weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/training_history.json
CHANGED
|
@@ -158,7 +158,17 @@
|
|
| 158 |
2.7509551217158634,
|
| 159 |
2.9926886714421785,
|
| 160 |
2.918874252606661,
|
| 161 |
-
3.157657731496371
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 162 |
],
|
| 163 |
"ce": [
|
| 164 |
4.357172321661925,
|
|
@@ -319,7 +329,17 @@
|
|
| 319 |
1.3537852550928409,
|
| 320 |
1.4857026207141386,
|
| 321 |
1.4910478177361,
|
| 322 |
-
1.548207331658938
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 323 |
],
|
| 324 |
"contrast": [
|
| 325 |
4.529944934600439,
|
|
@@ -480,7 +500,17 @@
|
|
| 480 |
1.3971698715136602,
|
| 481 |
1.5069860436213323,
|
| 482 |
1.4278264485108547,
|
| 483 |
-
1.6094504208136828
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 484 |
],
|
| 485 |
"lr": [
|
| 486 |
2.9999999999999997e-05,
|
|
@@ -641,6 +671,16 @@
|
|
| 641 |
2.547888339314832e-05,
|
| 642 |
2.4136614190006112e-05,
|
| 643 |
2.282911859011891e-05,
|
| 644 |
-
2.155675404972841e-05
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 645 |
]
|
| 646 |
}
|
|
|
|
| 158 |
2.7509551217158634,
|
| 159 |
2.9926886714421785,
|
| 160 |
2.918874252606661,
|
| 161 |
+
3.157657731496371,
|
| 162 |
+
3.0912926761003643,
|
| 163 |
+
3.20725641418726,
|
| 164 |
+
2.853640123666861,
|
| 165 |
+
3.065764631369175,
|
| 166 |
+
2.9422709775276674,
|
| 167 |
+
2.8492555040579575,
|
| 168 |
+
2.861172367517765,
|
| 169 |
+
2.7437335413235884,
|
| 170 |
+
3.0545060781332163,
|
| 171 |
+
3.0605580884676713
|
| 172 |
],
|
| 173 |
"ce": [
|
| 174 |
4.357172321661925,
|
|
|
|
| 329 |
1.3537852550928409,
|
| 330 |
1.4857026207141386,
|
| 331 |
1.4910478177361,
|
| 332 |
+
1.548207331658938,
|
| 333 |
+
1.4566624997518,
|
| 334 |
+
1.5562550109166366,
|
| 335 |
+
1.429246907432874,
|
| 336 |
+
1.5497427979723002,
|
| 337 |
+
1.457532100379467,
|
| 338 |
+
1.4270203954134233,
|
| 339 |
+
1.4064926836353082,
|
| 340 |
+
1.3590744248567483,
|
| 341 |
+
1.4778487952473836,
|
| 342 |
+
1.4917722631723453
|
| 343 |
],
|
| 344 |
"contrast": [
|
| 345 |
4.529944934600439,
|
|
|
|
| 500 |
1.3971698715136602,
|
| 501 |
1.5069860436213323,
|
| 502 |
1.4278264485108547,
|
| 503 |
+
1.6094504208136828,
|
| 504 |
+
1.634630188651574,
|
| 505 |
+
1.6510014061744396,
|
| 506 |
+
1.4243932255567648,
|
| 507 |
+
1.5160218374851422,
|
| 508 |
+
1.4847388852865269,
|
| 509 |
+
1.4222351142229177,
|
| 510 |
+
1.454679709749344,
|
| 511 |
+
1.3846591322085797,
|
| 512 |
+
1.5766573063074014,
|
| 513 |
+
1.5687858427182222
|
| 514 |
],
|
| 515 |
"lr": [
|
| 516 |
2.9999999999999997e-05,
|
|
|
|
| 671 |
2.547888339314832e-05,
|
| 672 |
2.4136614190006112e-05,
|
| 673 |
2.282911859011891e-05,
|
| 674 |
+
2.155675404972841e-05,
|
| 675 |
+
2.0319868420595586e-05,
|
| 676 |
+
1.9118799854901143e-05,
|
| 677 |
+
1.7953876712798343e-05,
|
| 678 |
+
1.6825417472642582e-05,
|
| 679 |
+
1.5733730643922538e-05,
|
| 680 |
+
1.4679114682916717e-05,
|
| 681 |
+
1.3661857911098582e-05,
|
| 682 |
+
1.2682238436312296e-05,
|
| 683 |
+
1.1740524076740871e-05,
|
| 684 |
+
1.0836972287687232e-05
|
| 685 |
]
|
| 686 |
}
|