Epoch 0 - Test Acc: 0.8050
Browse files- weights/6ddb8b71/best_107cee49.safetensors +3 -0
- weights/6ddb8b71/best_107cee49_state.pt +3 -0
- weights/6ddb8b71/best_6ddb8b71.safetensors +3 -0
- weights/6ddb8b71/best_6ddb8b71_state.pt +3 -0
- weights/6ddb8b71/best_af6ec6b0.safetensors +3 -0
- weights/6ddb8b71/best_af6ec6b0_state.pt +3 -0
- weights/6ddb8b71/best_bb16ab15.safetensors +3 -0
- weights/6ddb8b71/best_bb16ab15_state.pt +3 -0
- weights/6ddb8b71/best_c249e4ea.safetensors +3 -0
- weights/6ddb8b71/best_c249e4ea_state.pt +3 -0
- weights/6ddb8b71/best_da2075c0.safetensors +3 -0
- weights/6ddb8b71/best_da2075c0_state.pt +3 -0
- weights/6ddb8b71/checkpoint_107cee49_epoch_004.safetensors +3 -0
- weights/6ddb8b71/checkpoint_107cee49_epoch_004_state.pt +3 -0
- weights/6ddb8b71/checkpoint_bb16ab15_epoch_004.safetensors +3 -0
- weights/6ddb8b71/checkpoint_bb16ab15_epoch_004_state.pt +3 -0
- weights/6ddb8b71/checkpoint_c249e4ea_epoch_004.safetensors +3 -0
- weights/6ddb8b71/checkpoint_c249e4ea_epoch_004_state.pt +3 -0
- weights/6ddb8b71/checkpoint_da2075c0_epoch_004.safetensors +3 -0
- weights/6ddb8b71/checkpoint_da2075c0_epoch_004_state.pt +3 -0
- weights/6ddb8b71/config_107cee49.json +13 -0
- weights/6ddb8b71/config_3a285e2e.json +13 -0
- weights/6ddb8b71/config_6ddb8b71.json +13 -0
- weights/6ddb8b71/config_78df51aa.json +13 -0
- weights/6ddb8b71/config_af6ec6b0.json +13 -0
- weights/6ddb8b71/config_bb16ab15.json +13 -0
- weights/6ddb8b71/config_c249e4ea.json +13 -0
- weights/6ddb8b71/config_c42920db.json +13 -0
- weights/6ddb8b71/config_ccafe6f9.json +13 -0
- weights/6ddb8b71/config_cd384834.json +13 -0
- weights/6ddb8b71/config_da2075c0.json +13 -0
weights/6ddb8b71/best_107cee49.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e7ebb7e5b0d0384d68847d94555a50e42000b8ede00d8bfc995544f1e4f19b15
|
| 3 |
+
size 535260
|
weights/6ddb8b71/best_107cee49_state.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7fc50dce55d1bdd2865d44add7f8efa2c8b08aa5b70edca318afd1c7a10f9f03
|
| 3 |
+
size 1089611
|
weights/6ddb8b71/best_6ddb8b71.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d544dce434deac0ac69ffd1a00b2e6af69ffeaafbf5c9b9280599aba07e9077e
|
| 3 |
+
size 27483372
|
weights/6ddb8b71/best_6ddb8b71_state.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5bcb1cc20efc23097d5a36ea9ae1ea2b759214c367ca888e59e6073f677139f9
|
| 3 |
+
size 54985611
|
weights/6ddb8b71/best_af6ec6b0.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dacc3e9ad838e89a4e9392e3f91aac6bdd729fc8e12f62f99e737bd4fe1a08b6
|
| 3 |
+
size 8031724
|
weights/6ddb8b71/best_af6ec6b0_state.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e1aa4f1fbf11e294277f14300a8199086509b1e6390742eb23ccd91906364cae
|
| 3 |
+
size 16070603
|
weights/6ddb8b71/best_bb16ab15.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3a234cb25fd9db89d00a4af1fb7e0effb6092bb186beeb03ec956c24f1d61f84
|
| 3 |
+
size 3451276
|
weights/6ddb8b71/best_bb16ab15_state.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b746cd0be7cabb9e6c0d438ae36e6ee0f06b07d9fa51f6a7867e444eb9c6ca79
|
| 3 |
+
size 6910091
|
weights/6ddb8b71/best_c249e4ea.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e8eae840bde63ef7eec48123d035c4263a45b5919263e20bd674af8dd4be60e4
|
| 3 |
+
size 2511412
|
weights/6ddb8b71/best_c249e4ea_state.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:57977084aad393d3107d16fd2183e4d38ecee42a63d228a6322693ddc0e0e9c4
|
| 3 |
+
size 5030347
|
weights/6ddb8b71/best_da2075c0.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4af8f3b073dd14fda51166b9f0e4e268cd04b54a39b49f27bfd210ebd77c15b5
|
| 3 |
+
size 3451276
|
weights/6ddb8b71/best_da2075c0_state.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c50b1a4ef47d7ffda735d4e0a68e96129bbf829bc964315f8d11911c99933b62
|
| 3 |
+
size 6910091
|
weights/6ddb8b71/checkpoint_107cee49_epoch_004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e7ebb7e5b0d0384d68847d94555a50e42000b8ede00d8bfc995544f1e4f19b15
|
| 3 |
+
size 535260
|
weights/6ddb8b71/checkpoint_107cee49_epoch_004_state.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c2f30ebbfcf599b9fc9d322ad482986c6d5fa4485cef94169f26e7c73a164f51
|
| 3 |
+
size 1091307
|
weights/6ddb8b71/checkpoint_bb16ab15_epoch_004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3a234cb25fd9db89d00a4af1fb7e0effb6092bb186beeb03ec956c24f1d61f84
|
| 3 |
+
size 3451276
|
weights/6ddb8b71/checkpoint_bb16ab15_epoch_004_state.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:96f7f467f13b509840539e797982c71aecda261da36dbad46cdde9fa5f7fa4a9
|
| 3 |
+
size 6911787
|
weights/6ddb8b71/checkpoint_c249e4ea_epoch_004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e8eae840bde63ef7eec48123d035c4263a45b5919263e20bd674af8dd4be60e4
|
| 3 |
+
size 2511412
|
weights/6ddb8b71/checkpoint_c249e4ea_epoch_004_state.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3eed28995d7590522d2398ea2b223c6b2de7d9e44a992bf297bac04f5906e2f1
|
| 3 |
+
size 5032107
|
weights/6ddb8b71/checkpoint_da2075c0_epoch_004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4af8f3b073dd14fda51166b9f0e4e268cd04b54a39b49f27bfd210ebd77c15b5
|
| 3 |
+
size 3451276
|
weights/6ddb8b71/checkpoint_da2075c0_epoch_004_state.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5f454295010a29fdd54dad59629458cdf6514227e6e6c901e21ae5de57982fa6
|
| 3 |
+
size 6911787
|
weights/6ddb8b71/config_107cee49.json
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dim": 784,
|
| 3 |
+
"base_dim": 32,
|
| 4 |
+
"batch_size": 2048,
|
| 5 |
+
"epochs": 5,
|
| 6 |
+
"initial_lr": 0.001,
|
| 7 |
+
"temp_contrastive": 0.1,
|
| 8 |
+
"lambda_contrastive": 0.5,
|
| 9 |
+
"lambda_cayley": 0.01,
|
| 10 |
+
"dataset": "EMNIST_byclass",
|
| 11 |
+
"run_hash": "107cee49",
|
| 12 |
+
"timestamp": "20250927_201412"
|
| 13 |
+
}
|
weights/6ddb8b71/config_3a285e2e.json
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dim": 784,
|
| 3 |
+
"base_dim": 64,
|
| 4 |
+
"batch_size": 2048,
|
| 5 |
+
"epochs": 5,
|
| 6 |
+
"initial_lr": 0.001,
|
| 7 |
+
"temp_contrastive": 0.1,
|
| 8 |
+
"lambda_contrastive": 0.5,
|
| 9 |
+
"lambda_cayley": 0.01,
|
| 10 |
+
"dataset": "EMNIST_byclass",
|
| 11 |
+
"run_hash": "3a285e2e",
|
| 12 |
+
"timestamp": "20250927_200947"
|
| 13 |
+
}
|
weights/6ddb8b71/config_6ddb8b71.json
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dim": 784,
|
| 3 |
+
"base_dim": 2048,
|
| 4 |
+
"batch_size": 2048,
|
| 5 |
+
"epochs": 5,
|
| 6 |
+
"initial_lr": 0.001,
|
| 7 |
+
"temp_contrastive": 0.1,
|
| 8 |
+
"lambda_contrastive": 0.5,
|
| 9 |
+
"lambda_cayley": 0.01,
|
| 10 |
+
"dataset": "EMNIST_byclass",
|
| 11 |
+
"run_hash": "6ddb8b71",
|
| 12 |
+
"timestamp": "20250927_201913"
|
| 13 |
+
}
|
weights/6ddb8b71/config_78df51aa.json
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dim": 28,
|
| 3 |
+
"base_dim": 32,
|
| 4 |
+
"batch_size": 2048,
|
| 5 |
+
"epochs": 5,
|
| 6 |
+
"initial_lr": 0.001,
|
| 7 |
+
"temp_contrastive": 0.1,
|
| 8 |
+
"lambda_contrastive": 0.5,
|
| 9 |
+
"lambda_cayley": 0.01,
|
| 10 |
+
"dataset": "EMNIST_byclass",
|
| 11 |
+
"run_hash": "78df51aa",
|
| 12 |
+
"timestamp": "20250927_201849"
|
| 13 |
+
}
|
weights/6ddb8b71/config_af6ec6b0.json
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dim": 784,
|
| 3 |
+
"base_dim": 784,
|
| 4 |
+
"batch_size": 1024,
|
| 5 |
+
"epochs": 50,
|
| 6 |
+
"initial_lr": 0.001,
|
| 7 |
+
"temp_contrastive": 0.1,
|
| 8 |
+
"lambda_contrastive": 0.5,
|
| 9 |
+
"lambda_cayley": 0.01,
|
| 10 |
+
"dataset": "EMNIST_byclass",
|
| 11 |
+
"run_hash": "af6ec6b0",
|
| 12 |
+
"timestamp": "20250927_194146"
|
| 13 |
+
}
|
weights/6ddb8b71/config_bb16ab15.json
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dim": 784,
|
| 3 |
+
"base_dim": 256,
|
| 4 |
+
"batch_size": 1024,
|
| 5 |
+
"epochs": 5,
|
| 6 |
+
"initial_lr": 0.001,
|
| 7 |
+
"temp_contrastive": 0.1,
|
| 8 |
+
"lambda_contrastive": 0.5,
|
| 9 |
+
"lambda_cayley": 0.01,
|
| 10 |
+
"dataset": "EMNIST_byclass",
|
| 11 |
+
"run_hash": "bb16ab15",
|
| 12 |
+
"timestamp": "20250927_195352"
|
| 13 |
+
}
|
weights/6ddb8b71/config_c249e4ea.json
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dim": 784,
|
| 3 |
+
"base_dim": 64,
|
| 4 |
+
"batch_size": 1024,
|
| 5 |
+
"epochs": 5,
|
| 6 |
+
"initial_lr": 0.001,
|
| 7 |
+
"temp_contrastive": 0.1,
|
| 8 |
+
"lambda_contrastive": 0.5,
|
| 9 |
+
"lambda_cayley": 0.01,
|
| 10 |
+
"dataset": "EMNIST_byclass",
|
| 11 |
+
"run_hash": "c249e4ea",
|
| 12 |
+
"timestamp": "20250927_194324"
|
| 13 |
+
}
|
weights/6ddb8b71/config_c42920db.json
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dim": 784,
|
| 3 |
+
"base_dim": 32,
|
| 4 |
+
"batch_size": 2048,
|
| 5 |
+
"epochs": 5,
|
| 6 |
+
"initial_lr": 0.001,
|
| 7 |
+
"temp_contrastive": 0.1,
|
| 8 |
+
"lambda_contrastive": 0.5,
|
| 9 |
+
"lambda_cayley": 0.01,
|
| 10 |
+
"dataset": "EMNIST_byclass",
|
| 11 |
+
"run_hash": "c42920db",
|
| 12 |
+
"timestamp": "20250927_201340"
|
| 13 |
+
}
|
weights/6ddb8b71/config_ccafe6f9.json
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dim": 784,
|
| 3 |
+
"base_dim": 64,
|
| 4 |
+
"batch_size": 2048,
|
| 5 |
+
"epochs": 5,
|
| 6 |
+
"initial_lr": 0.001,
|
| 7 |
+
"temp_contrastive": 0.1,
|
| 8 |
+
"lambda_contrastive": 0.5,
|
| 9 |
+
"lambda_cayley": 0.01,
|
| 10 |
+
"dataset": "EMNIST_byclass",
|
| 11 |
+
"run_hash": "ccafe6f9",
|
| 12 |
+
"timestamp": "20250927_201234"
|
| 13 |
+
}
|
weights/6ddb8b71/config_cd384834.json
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dim": 784,
|
| 3 |
+
"base_dim": 64,
|
| 4 |
+
"batch_size": 2048,
|
| 5 |
+
"epochs": 5,
|
| 6 |
+
"initial_lr": 0.001,
|
| 7 |
+
"temp_contrastive": 0.1,
|
| 8 |
+
"lambda_contrastive": 0.5,
|
| 9 |
+
"lambda_cayley": 0.01,
|
| 10 |
+
"dataset": "EMNIST_byclass",
|
| 11 |
+
"run_hash": "cd384834",
|
| 12 |
+
"timestamp": "20250927_201249"
|
| 13 |
+
}
|
weights/6ddb8b71/config_da2075c0.json
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dim": 784,
|
| 3 |
+
"base_dim": 256,
|
| 4 |
+
"batch_size": 2048,
|
| 5 |
+
"epochs": 5,
|
| 6 |
+
"initial_lr": 0.001,
|
| 7 |
+
"temp_contrastive": 0.1,
|
| 8 |
+
"lambda_contrastive": 0.5,
|
| 9 |
+
"lambda_cayley": 0.01,
|
| 10 |
+
"dataset": "EMNIST_byclass",
|
| 11 |
+
"run_hash": "da2075c0",
|
| 12 |
+
"timestamp": "20250927_200116"
|
| 13 |
+
}
|