RuidiChang committed on
Commit
64dd0f7
·
verified ·
1 Parent(s): b015cf3

Sync missing vs SOURCE into TARGET under 'checkpoints' (batch 5, +50 files)

Browse files
Files changed (50) hide show
  1. checkpoints/residual_beta_clutrr_gpt2_train_correct_42/final_betas_new.pt +3 -0
  2. checkpoints/residual_beta_clutrr_gpt2_train_correct_42/final_betas_new.txt +12 -0
  3. checkpoints/residual_beta_clutrr_gpt2_train_correct_42/test_metrics_before_new.txt +2 -0
  4. checkpoints/residual_beta_clutrr_gpt2_train_correct_42/test_metrics_new.txt +2 -0
  5. checkpoints/residual_beta_clutrr_llama_test_ood_correct_0/config.txt +6 -0
  6. checkpoints/residual_beta_clutrr_llama_test_ood_correct_0/final_betas.pt +3 -0
  7. checkpoints/residual_beta_clutrr_llama_test_ood_correct_0/final_betas.txt +32 -0
  8. checkpoints/residual_beta_clutrr_llama_test_ood_correct_0/test_metrics.txt +2 -0
  9. checkpoints/residual_beta_clutrr_llama_test_ood_correct_0/test_metrics_before.txt +2 -0
  10. checkpoints/residual_beta_clutrr_llama_test_ood_correct_0_360_sup/config.txt +6 -0
  11. checkpoints/residual_beta_clutrr_llama_test_ood_correct_0_5_sup/config.txt +6 -0
  12. checkpoints/residual_beta_clutrr_llama_test_ood_correct_1/config.txt +6 -0
  13. checkpoints/residual_beta_clutrr_llama_test_ood_correct_1/final_betas.pt +3 -0
  14. checkpoints/residual_beta_clutrr_llama_test_ood_correct_1/final_betas.txt +32 -0
  15. checkpoints/residual_beta_clutrr_llama_test_ood_correct_1/test_metrics.txt +2 -0
  16. checkpoints/residual_beta_clutrr_llama_test_ood_correct_1/test_metrics_before.txt +2 -0
  17. checkpoints/residual_beta_clutrr_llama_test_ood_correct_1_360_sup/config.txt +6 -0
  18. checkpoints/residual_beta_clutrr_llama_test_ood_correct_1_5_sup/config.txt +6 -0
  19. checkpoints/residual_beta_clutrr_llama_test_ood_correct_2/config.txt +6 -0
  20. checkpoints/residual_beta_clutrr_llama_test_ood_correct_2/final_betas.pt +3 -0
  21. checkpoints/residual_beta_clutrr_llama_test_ood_correct_2/final_betas.txt +32 -0
  22. checkpoints/residual_beta_clutrr_llama_test_ood_correct_2/test_metrics.txt +2 -0
  23. checkpoints/residual_beta_clutrr_llama_test_ood_correct_2/test_metrics_before.txt +2 -0
  24. checkpoints/residual_beta_clutrr_llama_test_ood_correct_2_5_sup/config.txt +6 -0
  25. checkpoints/residual_beta_clutrr_llama_test_ood_correct_3/config.txt +6 -0
  26. checkpoints/residual_beta_clutrr_llama_test_ood_correct_3/final_betas.pt +3 -0
  27. checkpoints/residual_beta_clutrr_llama_test_ood_correct_3/final_betas.txt +32 -0
  28. checkpoints/residual_beta_clutrr_llama_test_ood_correct_3/test_metrics.txt +2 -0
  29. checkpoints/residual_beta_clutrr_llama_test_ood_correct_3/test_metrics_before.txt +2 -0
  30. checkpoints/residual_beta_clutrr_llama_test_ood_correct_42/config.txt +6 -0
  31. checkpoints/residual_beta_clutrr_llama_test_ood_correct_42/final_betas.pt +3 -0
  32. checkpoints/residual_beta_clutrr_llama_test_ood_correct_42/final_betas.txt +32 -0
  33. checkpoints/residual_beta_clutrr_llama_test_ood_correct_42/test_metrics.txt +2 -0
  34. checkpoints/residual_beta_clutrr_llama_test_ood_correct_42/test_metrics_before.txt +2 -0
  35. checkpoints/residual_beta_clutrr_llama_train_correct_0/config.txt +6 -0
  36. checkpoints/residual_beta_clutrr_llama_train_correct_0/final_betas.pt +3 -0
  37. checkpoints/residual_beta_clutrr_llama_train_correct_0/final_betas.txt +32 -0
  38. checkpoints/residual_beta_clutrr_llama_train_correct_0/test_metrics.txt +2 -0
  39. checkpoints/residual_beta_clutrr_llama_train_correct_0/test_metrics_before.txt +2 -0
  40. checkpoints/residual_beta_clutrr_llama_train_correct_1/config.txt +6 -0
  41. checkpoints/residual_beta_clutrr_llama_train_correct_1/final_betas.pt +3 -0
  42. checkpoints/residual_beta_clutrr_llama_train_correct_1/final_betas.txt +32 -0
  43. checkpoints/residual_beta_clutrr_llama_train_correct_1/test_metrics.txt +2 -0
  44. checkpoints/residual_beta_clutrr_llama_train_correct_1/test_metrics_before.txt +2 -0
  45. checkpoints/residual_beta_clutrr_llama_train_correct_2/config.txt +6 -0
  46. checkpoints/residual_beta_clutrr_llama_train_correct_2/final_betas.pt +3 -0
  47. checkpoints/residual_beta_clutrr_llama_train_correct_2/final_betas.txt +32 -0
  48. checkpoints/residual_beta_clutrr_llama_train_correct_2/test_metrics.txt +2 -0
  49. checkpoints/residual_beta_clutrr_llama_train_correct_2/test_metrics_before.txt +2 -0
  50. checkpoints/residual_beta_clutrr_llama_train_correct_3/config.txt +6 -0
checkpoints/residual_beta_clutrr_gpt2_train_correct_42/final_betas_new.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a49cd7851544a295dcd0158056c68f37e96c890a72d06bbb575deb36bc6add63
3
+ size 1220
checkpoints/residual_beta_clutrr_gpt2_train_correct_42/final_betas_new.txt ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Layer 0: 0.999653
2
+ Layer 1: 1.000033
3
+ Layer 2: 1.000485
4
+ Layer 3: 1.000472
5
+ Layer 4: 1.000640
6
+ Layer 5: 1.000615
7
+ Layer 6: 1.000651
8
+ Layer 7: 0.999653
9
+ Layer 8: 0.999722
10
+ Layer 9: 0.999756
11
+ Layer 10: 0.999356
12
+ Layer 11: 1.000359
checkpoints/residual_beta_clutrr_gpt2_train_correct_42/test_metrics_before_new.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 0.0287
2
+ Test Accuracy: 0.9868
checkpoints/residual_beta_clutrr_gpt2_train_correct_42/test_metrics_new.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 0.0287
2
+ Test Accuracy: 0.9868
checkpoints/residual_beta_clutrr_llama_test_ood_correct_0/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 4
3
+ lr: 5e-06
4
+ seed: 0
5
+ checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
6
+ output_dir: checkpoints/residual_beta_clutrr_llama_test_ood_correct_0
checkpoints/residual_beta_clutrr_llama_test_ood_correct_0/final_betas.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9aa06dfc1284e02e2e7728e6b995c26b83e397fd4d5daee0451f4bfc3d4e29a
3
+ size 1648
checkpoints/residual_beta_clutrr_llama_test_ood_correct_0/final_betas.txt ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Layer 0: 1.000076
2
+ Layer 1: 0.999903
3
+ Layer 2: 1.000117
4
+ Layer 3: 1.000051
5
+ Layer 4: 1.000268
6
+ Layer 5: 0.999983
7
+ Layer 6: 0.999930
8
+ Layer 7: 0.999788
9
+ Layer 8: 0.999786
10
+ Layer 9: 0.999840
11
+ Layer 10: 1.000265
12
+ Layer 11: 0.999614
13
+ Layer 12: 0.999760
14
+ Layer 13: 0.999672
15
+ Layer 14: 1.000397
16
+ Layer 15: 1.000151
17
+ Layer 16: 0.999691
18
+ Layer 17: 0.999929
19
+ Layer 18: 1.000166
20
+ Layer 19: 0.999558
21
+ Layer 20: 1.000380
22
+ Layer 21: 1.000044
23
+ Layer 22: 0.999544
24
+ Layer 23: 1.000252
25
+ Layer 24: 1.000250
26
+ Layer 25: 0.999792
27
+ Layer 26: 1.000169
28
+ Layer 27: 0.999551
29
+ Layer 28: 1.000153
30
+ Layer 29: 1.000162
31
+ Layer 30: 1.000268
32
+ Layer 31: 1.000337
checkpoints/residual_beta_clutrr_llama_test_ood_correct_0/test_metrics.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 2.1291
2
+ Test Accuracy: 0.6358
checkpoints/residual_beta_clutrr_llama_test_ood_correct_0/test_metrics_before.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 2.1332
2
+ Test Accuracy: 0.6358
checkpoints/residual_beta_clutrr_llama_test_ood_correct_0_360_sup/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 4
3
+ lr: 5e-06
4
+ seed: 0
5
+ checkpoint_dir: checkpoints/clutrr_llama/checkpoint-360
6
+ output_dir: checkpoints/residual_beta_clutrr_llama_test_ood_correct_0_360_sup
checkpoints/residual_beta_clutrr_llama_test_ood_correct_0_5_sup/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 4
3
+ lr: 5e-06
4
+ seed: 0
5
+ checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
6
+ output_dir: checkpoints/residual_beta_clutrr_llama_test_ood_correct_0_5_sup
checkpoints/residual_beta_clutrr_llama_test_ood_correct_1/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 4
3
+ lr: 5e-06
4
+ seed: 1
5
+ checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
6
+ output_dir: checkpoints/residual_beta_clutrr_llama_test_ood_correct_1
checkpoints/residual_beta_clutrr_llama_test_ood_correct_1/final_betas.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b45f03c6fb18352fe0f2a676974d31d079e74a074eb451d7b48633112093c782
3
+ size 1648
checkpoints/residual_beta_clutrr_llama_test_ood_correct_1/final_betas.txt ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Layer 0: 1.000057
2
+ Layer 1: 0.999892
3
+ Layer 2: 1.000131
4
+ Layer 3: 1.000091
5
+ Layer 4: 1.000279
6
+ Layer 5: 0.999976
7
+ Layer 6: 0.999942
8
+ Layer 7: 0.999838
9
+ Layer 8: 0.999756
10
+ Layer 9: 0.999839
11
+ Layer 10: 1.000284
12
+ Layer 11: 0.999585
13
+ Layer 12: 0.999785
14
+ Layer 13: 0.999654
15
+ Layer 14: 1.000371
16
+ Layer 15: 1.000184
17
+ Layer 16: 0.999707
18
+ Layer 17: 0.999920
19
+ Layer 18: 1.000166
20
+ Layer 19: 0.999567
21
+ Layer 20: 1.000366
22
+ Layer 21: 1.000078
23
+ Layer 22: 0.999533
24
+ Layer 23: 1.000281
25
+ Layer 24: 1.000284
26
+ Layer 25: 0.999787
27
+ Layer 26: 1.000183
28
+ Layer 27: 0.999543
29
+ Layer 28: 1.000109
30
+ Layer 29: 1.000183
31
+ Layer 30: 1.000251
32
+ Layer 31: 1.000286
checkpoints/residual_beta_clutrr_llama_test_ood_correct_1/test_metrics.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 2.1291
2
+ Test Accuracy: 0.6358
checkpoints/residual_beta_clutrr_llama_test_ood_correct_1/test_metrics_before.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 2.1332
2
+ Test Accuracy: 0.6358
checkpoints/residual_beta_clutrr_llama_test_ood_correct_1_360_sup/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 4
3
+ lr: 5e-06
4
+ seed: 1
5
+ checkpoint_dir: checkpoints/clutrr_llama/checkpoint-360
6
+ output_dir: checkpoints/residual_beta_clutrr_llama_test_ood_correct_1_360_sup
checkpoints/residual_beta_clutrr_llama_test_ood_correct_1_5_sup/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 4
3
+ lr: 5e-06
4
+ seed: 1
5
+ checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
6
+ output_dir: checkpoints/residual_beta_clutrr_llama_test_ood_correct_1_5_sup
checkpoints/residual_beta_clutrr_llama_test_ood_correct_2/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 4
3
+ lr: 5e-06
4
+ seed: 2
5
+ checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
6
+ output_dir: checkpoints/residual_beta_clutrr_llama_test_ood_correct_2
checkpoints/residual_beta_clutrr_llama_test_ood_correct_2/final_betas.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38be78b41c49822a2ea338a85880daf6dbffff3cf4c2e625fa38b98c0562cff2
3
+ size 1648
checkpoints/residual_beta_clutrr_llama_test_ood_correct_2/final_betas.txt ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Layer 0: 1.000049
2
+ Layer 1: 0.999899
3
+ Layer 2: 1.000125
4
+ Layer 3: 1.000065
5
+ Layer 4: 1.000246
6
+ Layer 5: 1.000024
7
+ Layer 6: 0.999946
8
+ Layer 7: 0.999762
9
+ Layer 8: 0.999763
10
+ Layer 9: 0.999902
11
+ Layer 10: 1.000269
12
+ Layer 11: 0.999593
13
+ Layer 12: 0.999716
14
+ Layer 13: 0.999663
15
+ Layer 14: 1.000386
16
+ Layer 15: 1.000159
17
+ Layer 16: 0.999684
18
+ Layer 17: 0.999871
19
+ Layer 18: 1.000162
20
+ Layer 19: 0.999569
21
+ Layer 20: 1.000359
22
+ Layer 21: 1.000065
23
+ Layer 22: 0.999560
24
+ Layer 23: 1.000259
25
+ Layer 24: 1.000261
26
+ Layer 25: 0.999805
27
+ Layer 26: 1.000163
28
+ Layer 27: 0.999591
29
+ Layer 28: 1.000092
30
+ Layer 29: 1.000202
31
+ Layer 30: 1.000239
32
+ Layer 31: 1.000287
checkpoints/residual_beta_clutrr_llama_test_ood_correct_2/test_metrics.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 2.1292
2
+ Test Accuracy: 0.6358
checkpoints/residual_beta_clutrr_llama_test_ood_correct_2/test_metrics_before.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 2.1332
2
+ Test Accuracy: 0.6358
checkpoints/residual_beta_clutrr_llama_test_ood_correct_2_5_sup/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 4
3
+ lr: 5e-06
4
+ seed: 2
5
+ checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
6
+ output_dir: checkpoints/residual_beta_clutrr_llama_test_ood_correct_2_5_sup
checkpoints/residual_beta_clutrr_llama_test_ood_correct_3/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 4
3
+ lr: 5e-06
4
+ seed: 3
5
+ checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
6
+ output_dir: checkpoints/residual_beta_clutrr_llama_test_ood_correct_3
checkpoints/residual_beta_clutrr_llama_test_ood_correct_3/final_betas.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37025576941bfc28183a87a9f943e3f91d68211ea9bb8632f0bbc5f1423a961e
3
+ size 1648
checkpoints/residual_beta_clutrr_llama_test_ood_correct_3/final_betas.txt ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Layer 0: 1.000044
2
+ Layer 1: 0.999919
3
+ Layer 2: 1.000139
4
+ Layer 3: 1.000065
5
+ Layer 4: 1.000301
6
+ Layer 5: 1.000002
7
+ Layer 6: 0.999924
8
+ Layer 7: 0.999817
9
+ Layer 8: 0.999759
10
+ Layer 9: 0.999882
11
+ Layer 10: 1.000232
12
+ Layer 11: 0.999656
13
+ Layer 12: 0.999739
14
+ Layer 13: 0.999704
15
+ Layer 14: 1.000372
16
+ Layer 15: 1.000132
17
+ Layer 16: 0.999701
18
+ Layer 17: 0.999889
19
+ Layer 18: 1.000138
20
+ Layer 19: 0.999565
21
+ Layer 20: 1.000427
22
+ Layer 21: 1.000082
23
+ Layer 22: 0.999549
24
+ Layer 23: 1.000314
25
+ Layer 24: 1.000259
26
+ Layer 25: 0.999759
27
+ Layer 26: 1.000139
28
+ Layer 27: 0.999559
29
+ Layer 28: 1.000105
30
+ Layer 29: 1.000153
31
+ Layer 30: 1.000232
32
+ Layer 31: 1.000292
checkpoints/residual_beta_clutrr_llama_test_ood_correct_3/test_metrics.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 2.1292
2
+ Test Accuracy: 0.6358
checkpoints/residual_beta_clutrr_llama_test_ood_correct_3/test_metrics_before.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 2.1332
2
+ Test Accuracy: 0.6358
checkpoints/residual_beta_clutrr_llama_test_ood_correct_42/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 4
3
+ lr: 5e-06
4
+ seed: 42
5
+ checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
6
+ output_dir: checkpoints/residual_beta_clutrr_llama_test_ood_correct_42
checkpoints/residual_beta_clutrr_llama_test_ood_correct_42/final_betas.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6847fcceea2ef09b014f6cdec124a5da538353a4bf654bf1a74f1848fd0fd98a
3
+ size 1648
checkpoints/residual_beta_clutrr_llama_test_ood_correct_42/final_betas.txt ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Layer 0: 1.000038
2
+ Layer 1: 0.999942
3
+ Layer 2: 1.000114
4
+ Layer 3: 1.000136
5
+ Layer 4: 1.000243
6
+ Layer 5: 1.000004
7
+ Layer 6: 0.999921
8
+ Layer 7: 0.999820
9
+ Layer 8: 0.999825
10
+ Layer 9: 0.999864
11
+ Layer 10: 1.000246
12
+ Layer 11: 0.999663
13
+ Layer 12: 0.999800
14
+ Layer 13: 0.999628
15
+ Layer 14: 1.000331
16
+ Layer 15: 1.000161
17
+ Layer 16: 0.999700
18
+ Layer 17: 0.999922
19
+ Layer 18: 1.000136
20
+ Layer 19: 0.999544
21
+ Layer 20: 1.000375
22
+ Layer 21: 1.000083
23
+ Layer 22: 0.999531
24
+ Layer 23: 1.000296
25
+ Layer 24: 1.000268
26
+ Layer 25: 0.999740
27
+ Layer 26: 1.000129
28
+ Layer 27: 0.999552
29
+ Layer 28: 1.000087
30
+ Layer 29: 1.000152
31
+ Layer 30: 1.000218
32
+ Layer 31: 1.000292
checkpoints/residual_beta_clutrr_llama_test_ood_correct_42/test_metrics.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 2.1293
2
+ Test Accuracy: 0.6358
checkpoints/residual_beta_clutrr_llama_test_ood_correct_42/test_metrics_before.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 2.1332
2
+ Test Accuracy: 0.6358
checkpoints/residual_beta_clutrr_llama_train_correct_0/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 4
3
+ lr: 5e-06
4
+ seed: 0
5
+ checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
6
+ output_dir: checkpoints/residual_beta_clutrr_llama_train_correct_0
checkpoints/residual_beta_clutrr_llama_train_correct_0/final_betas.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4fd60511989382bad3dd2d079448b464c20e588f75ee0bb90add31794121aa9
3
+ size 1648
checkpoints/residual_beta_clutrr_llama_train_correct_0/final_betas.txt ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Layer 0: 1.001698
2
+ Layer 1: 0.997893
3
+ Layer 2: 1.001930
4
+ Layer 3: 0.998901
5
+ Layer 4: 0.998956
6
+ Layer 5: 0.999694
7
+ Layer 6: 1.000498
8
+ Layer 7: 0.999588
9
+ Layer 8: 1.000236
10
+ Layer 9: 1.002018
11
+ Layer 10: 1.000320
12
+ Layer 11: 0.998410
13
+ Layer 12: 1.000116
14
+ Layer 13: 1.002069
15
+ Layer 14: 0.997052
16
+ Layer 15: 0.999062
17
+ Layer 16: 0.998260
18
+ Layer 17: 1.000410
19
+ Layer 18: 0.998667
20
+ Layer 19: 0.999585
21
+ Layer 20: 1.001028
22
+ Layer 21: 1.001209
23
+ Layer 22: 0.997678
24
+ Layer 23: 0.996642
25
+ Layer 24: 1.002759
26
+ Layer 25: 0.996454
27
+ Layer 26: 0.999449
28
+ Layer 27: 0.997274
29
+ Layer 28: 0.997749
30
+ Layer 29: 0.999731
31
+ Layer 30: 0.997755
32
+ Layer 31: 1.003472
checkpoints/residual_beta_clutrr_llama_train_correct_0/test_metrics.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 0.0226
2
+ Test Accuracy: 0.9942
checkpoints/residual_beta_clutrr_llama_train_correct_0/test_metrics_before.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 0.0236
2
+ Test Accuracy: 0.9940
checkpoints/residual_beta_clutrr_llama_train_correct_1/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 4
3
+ lr: 5e-06
4
+ seed: 1
5
+ checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
6
+ output_dir: checkpoints/residual_beta_clutrr_llama_train_correct_1
checkpoints/residual_beta_clutrr_llama_train_correct_1/final_betas.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8689cc6cca13b75bd3cf6de8ae694e0750ae2a7cc766a1599e9aeaf52144c9f
3
+ size 1648
checkpoints/residual_beta_clutrr_llama_train_correct_1/final_betas.txt ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Layer 0: 1.001549
2
+ Layer 1: 0.997922
3
+ Layer 2: 1.001824
4
+ Layer 3: 0.998915
5
+ Layer 4: 0.998898
6
+ Layer 5: 0.999670
7
+ Layer 6: 1.000539
8
+ Layer 7: 0.999587
9
+ Layer 8: 1.000297
10
+ Layer 9: 1.002017
11
+ Layer 10: 1.000371
12
+ Layer 11: 0.998439
13
+ Layer 12: 1.000070
14
+ Layer 13: 1.002052
15
+ Layer 14: 0.997161
16
+ Layer 15: 0.999056
17
+ Layer 16: 0.998278
18
+ Layer 17: 1.000382
19
+ Layer 18: 0.998720
20
+ Layer 19: 0.999580
21
+ Layer 20: 1.001064
22
+ Layer 21: 1.001211
23
+ Layer 22: 0.997648
24
+ Layer 23: 0.996551
25
+ Layer 24: 1.002808
26
+ Layer 25: 0.996599
27
+ Layer 26: 0.999425
28
+ Layer 27: 0.997328
29
+ Layer 28: 0.997917
30
+ Layer 29: 0.999739
31
+ Layer 30: 0.997880
32
+ Layer 31: 1.003539
checkpoints/residual_beta_clutrr_llama_train_correct_1/test_metrics.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 0.0227
2
+ Test Accuracy: 0.9942
checkpoints/residual_beta_clutrr_llama_train_correct_1/test_metrics_before.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 0.0236
2
+ Test Accuracy: 0.9940
checkpoints/residual_beta_clutrr_llama_train_correct_2/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 4
3
+ lr: 5e-06
4
+ seed: 2
5
+ checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
6
+ output_dir: checkpoints/residual_beta_clutrr_llama_train_correct_2
checkpoints/residual_beta_clutrr_llama_train_correct_2/final_betas.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f5201d946ab22599688df17dff73fd79a6fd3f457887d7c94107bdd88a3be9f
3
+ size 1648
checkpoints/residual_beta_clutrr_llama_train_correct_2/final_betas.txt ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Layer 0: 1.001709
2
+ Layer 1: 0.997907
3
+ Layer 2: 1.001903
4
+ Layer 3: 0.998951
5
+ Layer 4: 0.998942
6
+ Layer 5: 0.999700
7
+ Layer 6: 1.000541
8
+ Layer 7: 0.999545
9
+ Layer 8: 1.000248
10
+ Layer 9: 1.002025
11
+ Layer 10: 1.000368
12
+ Layer 11: 0.998406
13
+ Layer 12: 0.999990
14
+ Layer 13: 1.002042
15
+ Layer 14: 0.997180
16
+ Layer 15: 0.999018
17
+ Layer 16: 0.998291
18
+ Layer 17: 1.000450
19
+ Layer 18: 0.998765
20
+ Layer 19: 0.999521
21
+ Layer 20: 1.000991
22
+ Layer 21: 1.001229
23
+ Layer 22: 0.997614
24
+ Layer 23: 0.996626
25
+ Layer 24: 1.002810
26
+ Layer 25: 0.996541
27
+ Layer 26: 0.999404
28
+ Layer 27: 0.997411
29
+ Layer 28: 0.997892
30
+ Layer 29: 0.999704
31
+ Layer 30: 0.997883
32
+ Layer 31: 1.003333
checkpoints/residual_beta_clutrr_llama_train_correct_2/test_metrics.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 0.0226
2
+ Test Accuracy: 0.9942
checkpoints/residual_beta_clutrr_llama_train_correct_2/test_metrics_before.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 0.0236
2
+ Test Accuracy: 0.9940
checkpoints/residual_beta_clutrr_llama_train_correct_3/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 4
3
+ lr: 5e-06
4
+ seed: 3
5
+ checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
6
+ output_dir: checkpoints/residual_beta_clutrr_llama_train_correct_3