AbstractPhil commited on
Commit
3525fa1
·
verified ·
1 Parent(s): b3ce89f

Epoch 0 - Test Acc: 0.6363

Browse files
weights/107cee49/best_107cee49.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2d6be94bf2beb224ea752846d40bd6ebfc17cc07e055bd50692582119b30169
3
+ size 535260
weights/107cee49/best_107cee49_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:534b7da84468d22dea04896749435bb7cf8345a31f20289505fe6bd2b7974b8d
3
+ size 1089611
weights/107cee49/best_af6ec6b0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dacc3e9ad838e89a4e9392e3f91aac6bdd729fc8e12f62f99e737bd4fe1a08b6
3
+ size 8031724
weights/107cee49/best_af6ec6b0_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1aa4f1fbf11e294277f14300a8199086509b1e6390742eb23ccd91906364cae
3
+ size 16070603
weights/107cee49/best_bb16ab15.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a234cb25fd9db89d00a4af1fb7e0effb6092bb186beeb03ec956c24f1d61f84
3
+ size 3451276
weights/107cee49/best_bb16ab15_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b746cd0be7cabb9e6c0d438ae36e6ee0f06b07d9fa51f6a7867e444eb9c6ca79
3
+ size 6910091
weights/107cee49/best_c249e4ea.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8eae840bde63ef7eec48123d035c4263a45b5919263e20bd674af8dd4be60e4
3
+ size 2511412
weights/107cee49/best_c249e4ea_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57977084aad393d3107d16fd2183e4d38ecee42a63d228a6322693ddc0e0e9c4
3
+ size 5030347
weights/107cee49/best_da2075c0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4af8f3b073dd14fda51166b9f0e4e268cd04b54a39b49f27bfd210ebd77c15b5
3
+ size 3451276
weights/107cee49/best_da2075c0_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c50b1a4ef47d7ffda735d4e0a68e96129bbf829bc964315f8d11911c99933b62
3
+ size 6910091
weights/107cee49/checkpoint_bb16ab15_epoch_004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a234cb25fd9db89d00a4af1fb7e0effb6092bb186beeb03ec956c24f1d61f84
3
+ size 3451276
weights/107cee49/checkpoint_bb16ab15_epoch_004_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96f7f467f13b509840539e797982c71aecda261da36dbad46cdde9fa5f7fa4a9
3
+ size 6911787
weights/107cee49/checkpoint_c249e4ea_epoch_004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8eae840bde63ef7eec48123d035c4263a45b5919263e20bd674af8dd4be60e4
3
+ size 2511412
weights/107cee49/checkpoint_c249e4ea_epoch_004_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3eed28995d7590522d2398ea2b223c6b2de7d9e44a992bf297bac04f5906e2f1
3
+ size 5032107
weights/107cee49/checkpoint_da2075c0_epoch_004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4af8f3b073dd14fda51166b9f0e4e268cd04b54a39b49f27bfd210ebd77c15b5
3
+ size 3451276
weights/107cee49/checkpoint_da2075c0_epoch_004_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f454295010a29fdd54dad59629458cdf6514227e6e6c901e21ae5de57982fa6
3
+ size 6911787
weights/107cee49/config_107cee49.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_dim": 784,
3
+ "base_dim": 32,
4
+ "batch_size": 2048,
5
+ "epochs": 5,
6
+ "initial_lr": 0.001,
7
+ "temp_contrastive": 0.1,
8
+ "lambda_contrastive": 0.5,
9
+ "lambda_cayley": 0.01,
10
+ "dataset": "EMNIST_byclass",
11
+ "run_hash": "107cee49",
12
+ "timestamp": "20250927_201412"
13
+ }
weights/107cee49/config_3a285e2e.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_dim": 784,
3
+ "base_dim": 64,
4
+ "batch_size": 2048,
5
+ "epochs": 5,
6
+ "initial_lr": 0.001,
7
+ "temp_contrastive": 0.1,
8
+ "lambda_contrastive": 0.5,
9
+ "lambda_cayley": 0.01,
10
+ "dataset": "EMNIST_byclass",
11
+ "run_hash": "3a285e2e",
12
+ "timestamp": "20250927_200947"
13
+ }
weights/107cee49/config_af6ec6b0.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_dim": 784,
3
+ "base_dim": 784,
4
+ "batch_size": 1024,
5
+ "epochs": 50,
6
+ "initial_lr": 0.001,
7
+ "temp_contrastive": 0.1,
8
+ "lambda_contrastive": 0.5,
9
+ "lambda_cayley": 0.01,
10
+ "dataset": "EMNIST_byclass",
11
+ "run_hash": "af6ec6b0",
12
+ "timestamp": "20250927_194146"
13
+ }
weights/107cee49/config_bb16ab15.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_dim": 784,
3
+ "base_dim": 256,
4
+ "batch_size": 1024,
5
+ "epochs": 5,
6
+ "initial_lr": 0.001,
7
+ "temp_contrastive": 0.1,
8
+ "lambda_contrastive": 0.5,
9
+ "lambda_cayley": 0.01,
10
+ "dataset": "EMNIST_byclass",
11
+ "run_hash": "bb16ab15",
12
+ "timestamp": "20250927_195352"
13
+ }
weights/107cee49/config_c249e4ea.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_dim": 784,
3
+ "base_dim": 64,
4
+ "batch_size": 1024,
5
+ "epochs": 5,
6
+ "initial_lr": 0.001,
7
+ "temp_contrastive": 0.1,
8
+ "lambda_contrastive": 0.5,
9
+ "lambda_cayley": 0.01,
10
+ "dataset": "EMNIST_byclass",
11
+ "run_hash": "c249e4ea",
12
+ "timestamp": "20250927_194324"
13
+ }
weights/107cee49/config_c42920db.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_dim": 784,
3
+ "base_dim": 32,
4
+ "batch_size": 2048,
5
+ "epochs": 5,
6
+ "initial_lr": 0.001,
7
+ "temp_contrastive": 0.1,
8
+ "lambda_contrastive": 0.5,
9
+ "lambda_cayley": 0.01,
10
+ "dataset": "EMNIST_byclass",
11
+ "run_hash": "c42920db",
12
+ "timestamp": "20250927_201340"
13
+ }
weights/107cee49/config_ccafe6f9.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_dim": 784,
3
+ "base_dim": 64,
4
+ "batch_size": 2048,
5
+ "epochs": 5,
6
+ "initial_lr": 0.001,
7
+ "temp_contrastive": 0.1,
8
+ "lambda_contrastive": 0.5,
9
+ "lambda_cayley": 0.01,
10
+ "dataset": "EMNIST_byclass",
11
+ "run_hash": "ccafe6f9",
12
+ "timestamp": "20250927_201234"
13
+ }
weights/107cee49/config_cd384834.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_dim": 784,
3
+ "base_dim": 64,
4
+ "batch_size": 2048,
5
+ "epochs": 5,
6
+ "initial_lr": 0.001,
7
+ "temp_contrastive": 0.1,
8
+ "lambda_contrastive": 0.5,
9
+ "lambda_cayley": 0.01,
10
+ "dataset": "EMNIST_byclass",
11
+ "run_hash": "cd384834",
12
+ "timestamp": "20250927_201249"
13
+ }
weights/107cee49/config_da2075c0.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_dim": 784,
3
+ "base_dim": 256,
4
+ "batch_size": 2048,
5
+ "epochs": 5,
6
+ "initial_lr": 0.001,
7
+ "temp_contrastive": 0.1,
8
+ "lambda_contrastive": 0.5,
9
+ "lambda_cayley": 0.01,
10
+ "dataset": "EMNIST_byclass",
11
+ "run_hash": "da2075c0",
12
+ "timestamp": "20250927_200116"
13
+ }