AbstractPhil committed on
Commit
b02ac61
·
verified ·
1 Parent(s): 4975f22

Epoch 0 - Test Acc: 0.8050

Browse files
Files changed (31) hide show
  1. weights/6ddb8b71/best_107cee49.safetensors +3 -0
  2. weights/6ddb8b71/best_107cee49_state.pt +3 -0
  3. weights/6ddb8b71/best_6ddb8b71.safetensors +3 -0
  4. weights/6ddb8b71/best_6ddb8b71_state.pt +3 -0
  5. weights/6ddb8b71/best_af6ec6b0.safetensors +3 -0
  6. weights/6ddb8b71/best_af6ec6b0_state.pt +3 -0
  7. weights/6ddb8b71/best_bb16ab15.safetensors +3 -0
  8. weights/6ddb8b71/best_bb16ab15_state.pt +3 -0
  9. weights/6ddb8b71/best_c249e4ea.safetensors +3 -0
  10. weights/6ddb8b71/best_c249e4ea_state.pt +3 -0
  11. weights/6ddb8b71/best_da2075c0.safetensors +3 -0
  12. weights/6ddb8b71/best_da2075c0_state.pt +3 -0
  13. weights/6ddb8b71/checkpoint_107cee49_epoch_004.safetensors +3 -0
  14. weights/6ddb8b71/checkpoint_107cee49_epoch_004_state.pt +3 -0
  15. weights/6ddb8b71/checkpoint_bb16ab15_epoch_004.safetensors +3 -0
  16. weights/6ddb8b71/checkpoint_bb16ab15_epoch_004_state.pt +3 -0
  17. weights/6ddb8b71/checkpoint_c249e4ea_epoch_004.safetensors +3 -0
  18. weights/6ddb8b71/checkpoint_c249e4ea_epoch_004_state.pt +3 -0
  19. weights/6ddb8b71/checkpoint_da2075c0_epoch_004.safetensors +3 -0
  20. weights/6ddb8b71/checkpoint_da2075c0_epoch_004_state.pt +3 -0
  21. weights/6ddb8b71/config_107cee49.json +13 -0
  22. weights/6ddb8b71/config_3a285e2e.json +13 -0
  23. weights/6ddb8b71/config_6ddb8b71.json +13 -0
  24. weights/6ddb8b71/config_78df51aa.json +13 -0
  25. weights/6ddb8b71/config_af6ec6b0.json +13 -0
  26. weights/6ddb8b71/config_bb16ab15.json +13 -0
  27. weights/6ddb8b71/config_c249e4ea.json +13 -0
  28. weights/6ddb8b71/config_c42920db.json +13 -0
  29. weights/6ddb8b71/config_ccafe6f9.json +13 -0
  30. weights/6ddb8b71/config_cd384834.json +13 -0
  31. weights/6ddb8b71/config_da2075c0.json +13 -0
weights/6ddb8b71/best_107cee49.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7ebb7e5b0d0384d68847d94555a50e42000b8ede00d8bfc995544f1e4f19b15
3
+ size 535260
weights/6ddb8b71/best_107cee49_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fc50dce55d1bdd2865d44add7f8efa2c8b08aa5b70edca318afd1c7a10f9f03
3
+ size 1089611
weights/6ddb8b71/best_6ddb8b71.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d544dce434deac0ac69ffd1a00b2e6af69ffeaafbf5c9b9280599aba07e9077e
3
+ size 27483372
weights/6ddb8b71/best_6ddb8b71_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5bcb1cc20efc23097d5a36ea9ae1ea2b759214c367ca888e59e6073f677139f9
3
+ size 54985611
weights/6ddb8b71/best_af6ec6b0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dacc3e9ad838e89a4e9392e3f91aac6bdd729fc8e12f62f99e737bd4fe1a08b6
3
+ size 8031724
weights/6ddb8b71/best_af6ec6b0_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1aa4f1fbf11e294277f14300a8199086509b1e6390742eb23ccd91906364cae
3
+ size 16070603
weights/6ddb8b71/best_bb16ab15.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a234cb25fd9db89d00a4af1fb7e0effb6092bb186beeb03ec956c24f1d61f84
3
+ size 3451276
weights/6ddb8b71/best_bb16ab15_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b746cd0be7cabb9e6c0d438ae36e6ee0f06b07d9fa51f6a7867e444eb9c6ca79
3
+ size 6910091
weights/6ddb8b71/best_c249e4ea.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8eae840bde63ef7eec48123d035c4263a45b5919263e20bd674af8dd4be60e4
3
+ size 2511412
weights/6ddb8b71/best_c249e4ea_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57977084aad393d3107d16fd2183e4d38ecee42a63d228a6322693ddc0e0e9c4
3
+ size 5030347
weights/6ddb8b71/best_da2075c0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4af8f3b073dd14fda51166b9f0e4e268cd04b54a39b49f27bfd210ebd77c15b5
3
+ size 3451276
weights/6ddb8b71/best_da2075c0_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c50b1a4ef47d7ffda735d4e0a68e96129bbf829bc964315f8d11911c99933b62
3
+ size 6910091
weights/6ddb8b71/checkpoint_107cee49_epoch_004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7ebb7e5b0d0384d68847d94555a50e42000b8ede00d8bfc995544f1e4f19b15
3
+ size 535260
weights/6ddb8b71/checkpoint_107cee49_epoch_004_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2f30ebbfcf599b9fc9d322ad482986c6d5fa4485cef94169f26e7c73a164f51
3
+ size 1091307
weights/6ddb8b71/checkpoint_bb16ab15_epoch_004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a234cb25fd9db89d00a4af1fb7e0effb6092bb186beeb03ec956c24f1d61f84
3
+ size 3451276
weights/6ddb8b71/checkpoint_bb16ab15_epoch_004_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96f7f467f13b509840539e797982c71aecda261da36dbad46cdde9fa5f7fa4a9
3
+ size 6911787
weights/6ddb8b71/checkpoint_c249e4ea_epoch_004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8eae840bde63ef7eec48123d035c4263a45b5919263e20bd674af8dd4be60e4
3
+ size 2511412
weights/6ddb8b71/checkpoint_c249e4ea_epoch_004_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3eed28995d7590522d2398ea2b223c6b2de7d9e44a992bf297bac04f5906e2f1
3
+ size 5032107
weights/6ddb8b71/checkpoint_da2075c0_epoch_004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4af8f3b073dd14fda51166b9f0e4e268cd04b54a39b49f27bfd210ebd77c15b5
3
+ size 3451276
weights/6ddb8b71/checkpoint_da2075c0_epoch_004_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f454295010a29fdd54dad59629458cdf6514227e6e6c901e21ae5de57982fa6
3
+ size 6911787
weights/6ddb8b71/config_107cee49.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_dim": 784,
3
+ "base_dim": 32,
4
+ "batch_size": 2048,
5
+ "epochs": 5,
6
+ "initial_lr": 0.001,
7
+ "temp_contrastive": 0.1,
8
+ "lambda_contrastive": 0.5,
9
+ "lambda_cayley": 0.01,
10
+ "dataset": "EMNIST_byclass",
11
+ "run_hash": "107cee49",
12
+ "timestamp": "20250927_201412"
13
+ }
weights/6ddb8b71/config_3a285e2e.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_dim": 784,
3
+ "base_dim": 64,
4
+ "batch_size": 2048,
5
+ "epochs": 5,
6
+ "initial_lr": 0.001,
7
+ "temp_contrastive": 0.1,
8
+ "lambda_contrastive": 0.5,
9
+ "lambda_cayley": 0.01,
10
+ "dataset": "EMNIST_byclass",
11
+ "run_hash": "3a285e2e",
12
+ "timestamp": "20250927_200947"
13
+ }
weights/6ddb8b71/config_6ddb8b71.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_dim": 784,
3
+ "base_dim": 2048,
4
+ "batch_size": 2048,
5
+ "epochs": 5,
6
+ "initial_lr": 0.001,
7
+ "temp_contrastive": 0.1,
8
+ "lambda_contrastive": 0.5,
9
+ "lambda_cayley": 0.01,
10
+ "dataset": "EMNIST_byclass",
11
+ "run_hash": "6ddb8b71",
12
+ "timestamp": "20250927_201913"
13
+ }
weights/6ddb8b71/config_78df51aa.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_dim": 28,
3
+ "base_dim": 32,
4
+ "batch_size": 2048,
5
+ "epochs": 5,
6
+ "initial_lr": 0.001,
7
+ "temp_contrastive": 0.1,
8
+ "lambda_contrastive": 0.5,
9
+ "lambda_cayley": 0.01,
10
+ "dataset": "EMNIST_byclass",
11
+ "run_hash": "78df51aa",
12
+ "timestamp": "20250927_201849"
13
+ }
weights/6ddb8b71/config_af6ec6b0.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_dim": 784,
3
+ "base_dim": 784,
4
+ "batch_size": 1024,
5
+ "epochs": 50,
6
+ "initial_lr": 0.001,
7
+ "temp_contrastive": 0.1,
8
+ "lambda_contrastive": 0.5,
9
+ "lambda_cayley": 0.01,
10
+ "dataset": "EMNIST_byclass",
11
+ "run_hash": "af6ec6b0",
12
+ "timestamp": "20250927_194146"
13
+ }
weights/6ddb8b71/config_bb16ab15.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_dim": 784,
3
+ "base_dim": 256,
4
+ "batch_size": 1024,
5
+ "epochs": 5,
6
+ "initial_lr": 0.001,
7
+ "temp_contrastive": 0.1,
8
+ "lambda_contrastive": 0.5,
9
+ "lambda_cayley": 0.01,
10
+ "dataset": "EMNIST_byclass",
11
+ "run_hash": "bb16ab15",
12
+ "timestamp": "20250927_195352"
13
+ }
weights/6ddb8b71/config_c249e4ea.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_dim": 784,
3
+ "base_dim": 64,
4
+ "batch_size": 1024,
5
+ "epochs": 5,
6
+ "initial_lr": 0.001,
7
+ "temp_contrastive": 0.1,
8
+ "lambda_contrastive": 0.5,
9
+ "lambda_cayley": 0.01,
10
+ "dataset": "EMNIST_byclass",
11
+ "run_hash": "c249e4ea",
12
+ "timestamp": "20250927_194324"
13
+ }
weights/6ddb8b71/config_c42920db.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_dim": 784,
3
+ "base_dim": 32,
4
+ "batch_size": 2048,
5
+ "epochs": 5,
6
+ "initial_lr": 0.001,
7
+ "temp_contrastive": 0.1,
8
+ "lambda_contrastive": 0.5,
9
+ "lambda_cayley": 0.01,
10
+ "dataset": "EMNIST_byclass",
11
+ "run_hash": "c42920db",
12
+ "timestamp": "20250927_201340"
13
+ }
weights/6ddb8b71/config_ccafe6f9.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_dim": 784,
3
+ "base_dim": 64,
4
+ "batch_size": 2048,
5
+ "epochs": 5,
6
+ "initial_lr": 0.001,
7
+ "temp_contrastive": 0.1,
8
+ "lambda_contrastive": 0.5,
9
+ "lambda_cayley": 0.01,
10
+ "dataset": "EMNIST_byclass",
11
+ "run_hash": "ccafe6f9",
12
+ "timestamp": "20250927_201234"
13
+ }
weights/6ddb8b71/config_cd384834.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_dim": 784,
3
+ "base_dim": 64,
4
+ "batch_size": 2048,
5
+ "epochs": 5,
6
+ "initial_lr": 0.001,
7
+ "temp_contrastive": 0.1,
8
+ "lambda_contrastive": 0.5,
9
+ "lambda_cayley": 0.01,
10
+ "dataset": "EMNIST_byclass",
11
+ "run_hash": "cd384834",
12
+ "timestamp": "20250927_201249"
13
+ }
weights/6ddb8b71/config_da2075c0.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_dim": 784,
3
+ "base_dim": 256,
4
+ "batch_size": 2048,
5
+ "epochs": 5,
6
+ "initial_lr": 0.001,
7
+ "temp_contrastive": 0.1,
8
+ "lambda_contrastive": 0.5,
9
+ "lambda_cayley": 0.01,
10
+ "dataset": "EMNIST_byclass",
11
+ "run_hash": "da2075c0",
12
+ "timestamp": "20250927_200116"
13
+ }