Epoch 190 - 74.62% acc
Browse files- weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/README.md +1 -1
- weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/best.safetensors +1 -1
- weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/tensorboard/events.out.tfevents.1764539877.a14155bc494d.1798.0 +2 -2
- weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/training_history.json +44 -4
weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/README.md
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
# Run: run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740
|
| 2 |
|
| 3 |
## Results
|
| 4 |
-
- **Best Accuracy**: 74.
|
| 5 |
- **Dataset**: cifar100
|
| 6 |
- **Epochs**: 200
|
| 7 |
- **Model Version**: V2
|
|
|
|
| 1 |
# Run: run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740
|
| 2 |
|
| 3 |
## Results
|
| 4 |
+
- **Best Accuracy**: 74.62%
|
| 5 |
- **Dataset**: cifar100
|
| 6 |
- **Epochs**: 200
|
| 7 |
- **Model Version**: V2
|
weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/best.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 183271432
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2e9d43a39fca90bed1f741fef3744736e81fd2d71b8ec210de700b36b4d8cdc2
|
| 3 |
size 183271432
|
weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/tensorboard/events.out.tfevents.1764539877.a14155bc494d.1798.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dac312f2a5772bca4a48885321eba83f0ba92418fba8b55eed25a7d519b98622
|
| 3 |
+
size 779030
|
weights/run_001_v2_5scale_2x2patch_alphamix_d512_8layer_16heads_16wormhole_20251130_215740/training_history.json
CHANGED
|
@@ -178,7 +178,17 @@
|
|
| 178 |
2.9907731959452994,
|
| 179 |
2.937100050541071,
|
| 180 |
3.030314071973165,
|
| 181 |
-
3.0131373691253174
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 182 |
],
|
| 183 |
"ce": [
|
| 184 |
4.357172321661925,
|
|
@@ -359,7 +369,17 @@
|
|
| 359 |
1.4935736950391378,
|
| 360 |
1.3842732094801389,
|
| 361 |
1.4957989322833525,
|
| 362 |
-
1.4497574080259372
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 363 |
],
|
| 364 |
"contrast": [
|
| 365 |
4.529944934600439,
|
|
@@ -540,7 +560,17 @@
|
|
| 540 |
1.4971995182144335,
|
| 541 |
1.5528268475563098,
|
| 542 |
1.534515163760919,
|
| 543 |
-
1.5633799798977681
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 544 |
],
|
| 545 |
"lr": [
|
| 546 |
2.9999999999999997e-05,
|
|
@@ -721,6 +751,16 @@
|
|
| 721 |
5.600080585004683e-06,
|
| 722 |
5.009832304169187e-06,
|
| 723 |
4.459586697776543e-06,
|
| 724 |
-
3.9494941974813935e-06
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 725 |
]
|
| 726 |
}
|
|
|
|
| 178 |
2.9907731959452994,
|
| 179 |
2.937100050541071,
|
| 180 |
3.030314071973165,
|
| 181 |
+
3.0131373691253174,
|
| 182 |
+
2.9583037671370382,
|
| 183 |
+
2.9715089440345763,
|
| 184 |
+
2.9340077991668996,
|
| 185 |
+
3.0631991940431105,
|
| 186 |
+
2.9617994571343447,
|
| 187 |
+
2.760121491398567,
|
| 188 |
+
2.982011616306427,
|
| 189 |
+
2.8773136229087144,
|
| 190 |
+
2.881724190177062,
|
| 191 |
+
2.9527760760906414
|
| 192 |
],
|
| 193 |
"ce": [
|
| 194 |
4.357172321661925,
|
|
|
|
| 369 |
1.4935736950391378,
|
| 370 |
1.3842732094801389,
|
| 371 |
1.4957989322833525,
|
| 372 |
+
1.4497574080259372,
|
| 373 |
+
1.4653237798657173,
|
| 374 |
+
1.4758108348036423,
|
| 375 |
+
1.5036061962827658,
|
| 376 |
+
1.4942389322397036,
|
| 377 |
+
1.4049325407315523,
|
| 378 |
+
1.4017816019745974,
|
| 379 |
+
1.4297002922265958,
|
| 380 |
+
1.4251254486349914,
|
| 381 |
+
1.5000684622770701,
|
| 382 |
+
1.486207452034339
|
| 383 |
],
|
| 384 |
"contrast": [
|
| 385 |
4.529944934600439,
|
|
|
|
| 560 |
1.4971995182144335,
|
| 561 |
1.5528268475563098,
|
| 562 |
1.534515163760919,
|
| 563 |
+
1.5633799798977681,
|
| 564 |
+
1.4929800024399391,
|
| 565 |
+
1.4956981138541148,
|
| 566 |
+
1.4304016046034984,
|
| 567 |
+
1.5689602623765284,
|
| 568 |
+
1.5568669258019863,
|
| 569 |
+
1.358339895804723,
|
| 570 |
+
1.5523113168967075,
|
| 571 |
+
1.4521881712170748,
|
| 572 |
+
1.3816557424190716,
|
| 573 |
+
1.4665686394923771
|
| 574 |
],
|
| 575 |
"lr": [
|
| 576 |
2.9999999999999997e-05,
|
|
|
|
| 751 |
5.600080585004683e-06,
|
| 752 |
5.009832304169187e-06,
|
| 753 |
4.459586697776543e-06,
|
| 754 |
+
3.9494941974813935e-06,
|
| 755 |
+
3.47969425748007e-06,
|
| 756 |
+
3.0503153163852546e-06,
|
| 757 |
+
2.6614747621120904e-06,
|
| 758 |
+
2.3132788997856054e-06,
|
| 759 |
+
2.0058229226778206e-06,
|
| 760 |
+
1.7391908861829483e-06,
|
| 761 |
+
1.5134556848374758e-06,
|
| 762 |
+
1.3286790323914947e-06,
|
| 763 |
+
1.1849114449367806e-06,
|
| 764 |
+
1.0821922270962664e-06
|
| 765 |
]
|
| 766 |
}
|