Commit
·
a41c411
1
Parent(s):
32fde3f
ViT GQA
Browse files- checkpoints_vit_gqa/epoch_100_end/meta.json +10 -0
- checkpoints_vit_gqa/epoch_100_end/model.pth +3 -0
- checkpoints_vit_gqa/epoch_100_end/optimizer.pth +3 -0
- checkpoints_vit_gqa/epoch_100_end/scaler.pth +3 -0
- checkpoints_vit_gqa/epoch_100_end/scheduler.pth +3 -0
- checkpoints_vit_gqa/epoch_50_end/meta.json +10 -0
- checkpoints_vit_gqa/epoch_50_end/model.pth +3 -0
- checkpoints_vit_gqa/epoch_50_end/optimizer.pth +3 -0
- checkpoints_vit_gqa/epoch_50_end/scaler.pth +3 -0
- checkpoints_vit_gqa/epoch_50_end/scheduler.pth +3 -0
checkpoints_vit_gqa/epoch_100_end/meta.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"epoch": 100,
|
| 3 |
+
"step": 195,
|
| 4 |
+
"train_loss": 0.2681627121543884,
|
| 5 |
+
"train_acc": 92.869,
|
| 6 |
+
"val_loss": 3.072373919677734,
|
| 7 |
+
"val_acc": 46.17,
|
| 8 |
+
"lr": 0.0002807397082996218,
|
| 9 |
+
"timestamp": "2025-11-16T01:47:23.199944"
|
| 10 |
+
}
|
checkpoints_vit_gqa/epoch_100_end/model.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1d25af364a150d7af7c88bc6f284b625299965da6b6b527b8b2a1faa93fe69ce
|
| 3 |
+
size 305966291
|
checkpoints_vit_gqa/epoch_100_end/optimizer.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bf5b166ef2ef210f2991c6dda658b360dd0442ffece1240442a059c8a57bcbc8
|
| 3 |
+
size 610744011
|
checkpoints_vit_gqa/epoch_100_end/scaler.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:100a5164efdf6285dac14d16444d2d4c2cebb12bf4cfd32631ad60a1f2c79bec
|
| 3 |
+
size 1383
|
checkpoints_vit_gqa/epoch_100_end/scheduler.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:16c3765c4609ed023f9c075fdcf273e2f5f33cb31c3950b2c78d043053777d05
|
| 3 |
+
size 1721
|
checkpoints_vit_gqa/epoch_50_end/meta.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"epoch": 50,
|
| 3 |
+
"step": 195,
|
| 4 |
+
"train_loss": 1.7981066999053954,
|
| 5 |
+
"train_acc": 54.975,
|
| 6 |
+
"val_loss": 2.3799499137878417,
|
| 7 |
+
"val_acc": 44.56,
|
| 8 |
+
"lr": 0.00011876102844562934,
|
| 9 |
+
"timestamp": "2025-11-16T00:05:31.553502"
|
| 10 |
+
}
|
checkpoints_vit_gqa/epoch_50_end/model.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4b3e14e69b3b14f43c87ce7542ca65ae78357c60ed764e8c0e6942353917fe46
|
| 3 |
+
size 305966291
|
checkpoints_vit_gqa/epoch_50_end/optimizer.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:05f79dbc85a05bd1fb9207e7513ef9efc8e8178127fb40548739bbd5dc4bdd82
|
| 3 |
+
size 610744011
|
checkpoints_vit_gqa/epoch_50_end/scaler.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23fed54ea59e1797e4b789ebb513f51e7dee2396e3fd64774fc9149687165330
|
| 3 |
+
size 1383
|
checkpoints_vit_gqa/epoch_50_end/scheduler.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4ecff30bd24e41f65aacf10e8a02fdb891dbb351617585790f564abdb81741b0
|
| 3 |
+
size 1721
|