RuidiChang committed on
Commit
caa2a83
·
verified ·
1 Parent(s): ed92b4f

Sync missing vs SOURCE into TARGET under 'checkpoints' (batch 7, +50 files)

Browse files
Files changed (50) hide show
  1. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3/config.txt +6 -0
  2. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3/final_betas.pt +3 -0
  3. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3/final_betas.txt +24 -0
  4. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3/test_metrics.txt +2 -0
  5. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3/test_metrics_before.txt +2 -0
  6. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr/config.txt +6 -0
  7. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr/final_betas.pt +3 -0
  8. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr/final_betas.txt +24 -0
  9. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr/test_metrics.txt +2 -0
  10. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr/test_metrics_before.txt +2 -0
  11. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_sup/config.txt +6 -0
  12. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_sup/final_betas.pt +3 -0
  13. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_sup/final_betas.txt +24 -0
  14. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_sup/test_metrics_before.txt +2 -0
  15. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72/config.txt +6 -0
  16. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72/final_betas.pt +3 -0
  17. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72/final_betas.txt +24 -0
  18. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72/test_metrics.txt +2 -0
  19. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72/test_metrics_before.txt +2 -0
  20. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1/config.txt +6 -0
  21. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1/final_betas.pt +3 -0
  22. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1/final_betas.txt +24 -0
  23. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1/test_metrics.txt +2 -0
  24. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1/test_metrics_before.txt +2 -0
  25. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360/config.txt +6 -0
  26. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360/final_betas.pt +3 -0
  27. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360/final_betas.txt +24 -0
  28. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360/test_metrics.txt +2 -0
  29. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360/test_metrics_before.txt +2 -0
  30. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3/config.txt +6 -0
  31. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3/final_betas.pt +3 -0
  32. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3/final_betas.txt +24 -0
  33. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3/test_metrics.txt +2 -0
  34. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3/test_metrics_before.txt +2 -0
  35. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_sup/config.txt +6 -0
  36. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_sup/final_betas.pt +3 -0
  37. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_sup/final_betas.txt +24 -0
  38. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_sup/test_metrics_before.txt +2 -0
  39. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2/config.txt +6 -0
  40. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2/final_betas.pt +3 -0
  41. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2/final_betas.txt +24 -0
  42. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2/test_metrics.txt +2 -0
  43. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2/test_metrics_before.txt +2 -0
  44. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360/config.txt +6 -0
  45. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360/final_betas.pt +3 -0
  46. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360/final_betas.txt +24 -0
  47. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360/test_metrics.txt +2 -0
  48. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360/test_metrics_before.txt +2 -0
  49. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360_3/config.txt +6 -0
  50. checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360_3/final_betas.pt +3 -0
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 16
3
+ lr: 5e-06
4
+ seed: 0
5
+ checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-360
6
+ output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3/final_betas.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ec8aa784af858b9dbadd298b1a8287e53b83e49c10a8158d483d155df7e05a7
3
+ size 1264
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3/final_betas.txt ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Layer 0: 1.000146
2
+ Layer 1: 1.000061
3
+ Layer 2: 1.000154
4
+ Layer 3: 1.000082
5
+ Layer 4: 0.999892
6
+ Layer 5: 0.999872
7
+ Layer 6: 0.999877
8
+ Layer 7: 1.000151
9
+ Layer 8: 1.000153
10
+ Layer 9: 0.999899
11
+ Layer 10: 0.999869
12
+ Layer 11: 0.999845
13
+ Layer 12: 0.999841
14
+ Layer 13: 1.000128
15
+ Layer 14: 1.000091
16
+ Layer 15: 0.999871
17
+ Layer 16: 0.999961
18
+ Layer 17: 1.000145
19
+ Layer 18: 1.000103
20
+ Layer 19: 1.000005
21
+ Layer 20: 0.999842
22
+ Layer 21: 1.000116
23
+ Layer 22: 0.999855
24
+ Layer 23: 1.000049
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3/test_metrics.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 5.4055
2
+ Test Accuracy: 0.3555
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3/test_metrics_before.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 5.4091
2
+ Test Accuracy: 0.3555
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 5
2
+ batch_size: 16
3
+ lr: 5e-06
4
+ seed: 0
5
+ checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-360
6
+ output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr/final_betas.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95702e55da289a0b8494bd6e5400d0d1830b7a24c51acd6fd1ae5078d8696491
3
+ size 1264
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr/final_betas.txt ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Layer 0: 1.000226
2
+ Layer 1: 1.000219
3
+ Layer 2: 1.000252
4
+ Layer 3: 1.000103
5
+ Layer 4: 0.999762
6
+ Layer 5: 0.999922
7
+ Layer 6: 0.999992
8
+ Layer 7: 1.000247
9
+ Layer 8: 1.000198
10
+ Layer 9: 0.999792
11
+ Layer 10: 0.999807
12
+ Layer 11: 0.999734
13
+ Layer 12: 0.999739
14
+ Layer 13: 0.999964
15
+ Layer 14: 1.000038
16
+ Layer 15: 0.999855
17
+ Layer 16: 0.999795
18
+ Layer 17: 1.000256
19
+ Layer 18: 1.000233
20
+ Layer 19: 1.000032
21
+ Layer 20: 0.999748
22
+ Layer 21: 1.000211
23
+ Layer 22: 0.999767
24
+ Layer 23: 1.000104
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr/test_metrics.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 4.0870
2
+ Test Accuracy: 0.4506
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr/test_metrics_before.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 4.0911
2
+ Test Accuracy: 0.4506
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_sup/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 16
3
+ lr: 5e-06
4
+ seed: 0
5
+ checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-360
6
+ output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_sup
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_sup/final_betas.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d35932d084b4582bfdffc12a97b911a9bfe84189f74825648bd86332c6051a0
3
+ size 1264
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_sup/final_betas.txt ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Layer 0: 1.002702
2
+ Layer 1: 1.002368
3
+ Layer 2: 1.002750
4
+ Layer 3: 1.000241
5
+ Layer 4: 0.997064
6
+ Layer 5: 0.999475
7
+ Layer 6: 0.997436
8
+ Layer 7: 1.000434
9
+ Layer 8: 1.001455
10
+ Layer 9: 0.997719
11
+ Layer 10: 1.000210
12
+ Layer 11: 0.997204
13
+ Layer 12: 0.997816
14
+ Layer 13: 1.000603
15
+ Layer 14: 1.001274
16
+ Layer 15: 0.998692
17
+ Layer 16: 1.001638
18
+ Layer 17: 1.002667
19
+ Layer 18: 0.997705
20
+ Layer 19: 0.999324
21
+ Layer 20: 0.996989
22
+ Layer 21: 0.999316
23
+ Layer 22: 0.997883
24
+ Layer 23: 1.001790
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_sup/test_metrics_before.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 3.3787
2
+ Test Accuracy: 0.4416
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 10
2
+ batch_size: 16
3
+ lr: 5e-06
4
+ seed: 0
5
+ checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-72
6
+ output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72/final_betas.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e12d1ed7b9028807dd713872d39e3798aa6a8badb7631baa025bfc9c7adc3f05
3
+ size 1264
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72/final_betas.txt ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Layer 0: 0.999622
2
+ Layer 1: 1.000431
3
+ Layer 2: 1.001851
4
+ Layer 3: 1.000636
5
+ Layer 4: 1.000028
6
+ Layer 5: 0.999593
7
+ Layer 6: 1.001501
8
+ Layer 7: 1.001937
9
+ Layer 8: 1.000608
10
+ Layer 9: 0.998138
11
+ Layer 10: 0.999010
12
+ Layer 11: 0.998071
13
+ Layer 12: 0.998215
14
+ Layer 13: 1.001478
15
+ Layer 14: 1.001404
16
+ Layer 15: 1.000400
17
+ Layer 16: 0.997987
18
+ Layer 17: 1.001807
19
+ Layer 18: 1.001886
20
+ Layer 19: 1.000023
21
+ Layer 20: 0.997924
22
+ Layer 21: 1.001831
23
+ Layer 22: 0.997960
24
+ Layer 23: 1.001933
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72/test_metrics.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 1.2903
2
+ Test Accuracy: 0.5284
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72/test_metrics_before.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 1.2988
2
+ Test Accuracy: 0.5254
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 16
3
+ lr: 5e-06
4
+ seed: 1
5
+ checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-360
6
+ output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1/final_betas.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cacc6b34ad88242836c930290b8c88b7eb8e644a422561833f7996fa7a7b0e09
3
+ size 1264
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1/final_betas.txt ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Layer 0: 1.000347
2
+ Layer 1: 1.000353
3
+ Layer 2: 1.000068
4
+ Layer 3: 1.000365
5
+ Layer 4: 0.999955
6
+ Layer 5: 0.999837
7
+ Layer 6: 0.999764
8
+ Layer 7: 1.000164
9
+ Layer 8: 1.000091
10
+ Layer 9: 0.999845
11
+ Layer 10: 0.999830
12
+ Layer 11: 0.999602
13
+ Layer 12: 0.999656
14
+ Layer 13: 0.999956
15
+ Layer 14: 0.999963
16
+ Layer 15: 0.999686
17
+ Layer 16: 1.000408
18
+ Layer 17: 1.000397
19
+ Layer 18: 0.999666
20
+ Layer 19: 0.999864
21
+ Layer 20: 0.999607
22
+ Layer 21: 0.999888
23
+ Layer 22: 0.999946
24
+ Layer 23: 1.000424
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1/test_metrics.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 5.2827
2
+ Test Accuracy: 0.2901
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1/test_metrics_before.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 5.2859
2
+ Test Accuracy: 0.2891
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 5
2
+ batch_size: 16
3
+ lr: 5e-06
4
+ seed: 1
5
+ checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-360
6
+ output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360/final_betas.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f819fe0687f669869f996d2a7232deb7218ad86aeda25975fc357fd3f93b481
3
+ size 1264
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360/final_betas.txt ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Layer 0: 1.000037
2
+ Layer 1: 1.000029
3
+ Layer 2: 1.000036
4
+ Layer 3: 1.000025
5
+ Layer 4: 0.999968
6
+ Layer 5: 0.999962
7
+ Layer 6: 0.999965
8
+ Layer 7: 1.000034
9
+ Layer 8: 1.000037
10
+ Layer 9: 0.999976
11
+ Layer 10: 0.999965
12
+ Layer 11: 0.999961
13
+ Layer 12: 0.999963
14
+ Layer 13: 1.000014
15
+ Layer 14: 1.000010
16
+ Layer 15: 0.999965
17
+ Layer 16: 0.999995
18
+ Layer 17: 1.000038
19
+ Layer 18: 1.000028
20
+ Layer 19: 1.000015
21
+ Layer 20: 0.999963
22
+ Layer 21: 1.000033
23
+ Layer 22: 0.999964
24
+ Layer 23: 1.000017
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360/test_metrics.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 5.4082
2
+ Test Accuracy: 0.3555
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360/test_metrics_before.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 5.4091
2
+ Test Accuracy: 0.3555
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 16
3
+ lr: 5e-06
4
+ seed: 1
5
+ checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-360
6
+ output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3/final_betas.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16e2d18d3d5e4433d05f2aabe9004df7a2f7ba7696057d27f96c9eca7567dc91
3
+ size 1264
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3/final_betas.txt ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Layer 0: 1.000148
2
+ Layer 1: 1.000062
3
+ Layer 2: 1.000157
4
+ Layer 3: 1.000092
5
+ Layer 4: 0.999862
6
+ Layer 5: 0.999862
7
+ Layer 6: 0.999859
8
+ Layer 7: 1.000152
9
+ Layer 8: 1.000156
10
+ Layer 9: 0.999890
11
+ Layer 10: 0.999887
12
+ Layer 11: 0.999850
13
+ Layer 12: 0.999844
14
+ Layer 13: 1.000109
15
+ Layer 14: 1.000067
16
+ Layer 15: 0.999888
17
+ Layer 16: 0.999977
18
+ Layer 17: 1.000146
19
+ Layer 18: 1.000116
20
+ Layer 19: 1.000003
21
+ Layer 20: 0.999856
22
+ Layer 21: 1.000133
23
+ Layer 22: 0.999858
24
+ Layer 23: 1.000063
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3/test_metrics.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 5.4055
2
+ Test Accuracy: 0.3555
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3/test_metrics_before.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 5.4091
2
+ Test Accuracy: 0.3555
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_sup/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 16
3
+ lr: 5e-06
4
+ seed: 1
5
+ checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-360
6
+ output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_sup
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_sup/final_betas.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d587c824c162236d009fc70a41bae4eb65b6359c92a3103432c0f68de63fdf8a
3
+ size 1264
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_sup/final_betas.txt ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Layer 0: 1.002667
2
+ Layer 1: 1.002316
3
+ Layer 2: 1.002842
4
+ Layer 3: 1.000266
5
+ Layer 4: 0.997047
6
+ Layer 5: 0.999469
7
+ Layer 6: 0.997509
8
+ Layer 7: 1.000430
9
+ Layer 8: 1.001477
10
+ Layer 9: 0.997662
11
+ Layer 10: 1.000166
12
+ Layer 11: 0.997214
13
+ Layer 12: 0.997769
14
+ Layer 13: 1.000648
15
+ Layer 14: 1.001307
16
+ Layer 15: 0.998655
17
+ Layer 16: 1.001639
18
+ Layer 17: 1.002717
19
+ Layer 18: 0.997743
20
+ Layer 19: 0.999275
21
+ Layer 20: 0.997016
22
+ Layer 21: 0.999369
23
+ Layer 22: 0.997829
24
+ Layer 23: 1.001885
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_sup/test_metrics_before.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 3.3787
2
+ Test Accuracy: 0.4416
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 16
3
+ lr: 5e-06
4
+ seed: 2
5
+ checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-360
6
+ output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2/final_betas.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fd2a70386f4d0f80686f1564cb59f99203366a6c6e0226dac8d9bf915c67152
3
+ size 1264
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2/final_betas.txt ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Layer 0: 1.000291
2
+ Layer 1: 1.000355
3
+ Layer 2: 1.000052
4
+ Layer 3: 1.000314
5
+ Layer 4: 0.999943
6
+ Layer 5: 0.999886
7
+ Layer 6: 0.999795
8
+ Layer 7: 1.000184
9
+ Layer 8: 1.000067
10
+ Layer 9: 0.999857
11
+ Layer 10: 0.999808
12
+ Layer 11: 0.999593
13
+ Layer 12: 0.999660
14
+ Layer 13: 0.999982
15
+ Layer 14: 0.999981
16
+ Layer 15: 0.999664
17
+ Layer 16: 1.000403
18
+ Layer 17: 1.000389
19
+ Layer 18: 0.999671
20
+ Layer 19: 0.999880
21
+ Layer 20: 0.999605
22
+ Layer 21: 0.999844
23
+ Layer 22: 0.999943
24
+ Layer 23: 1.000423
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2/test_metrics.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 5.2828
2
+ Test Accuracy: 0.2901
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2/test_metrics_before.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 5.2859
2
+ Test Accuracy: 0.2891
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 5
2
+ batch_size: 16
3
+ lr: 5e-06
4
+ seed: 2
5
+ checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-360
6
+ output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360/final_betas.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34c9a4bd1d6446394b664214d2ad467cf9ef2a84638069c1f598eaefd654be6e
3
+ size 1264
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360/final_betas.txt ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Layer 0: 1.000035
2
+ Layer 1: 1.000015
3
+ Layer 2: 1.000033
4
+ Layer 3: 1.000008
5
+ Layer 4: 0.999968
6
+ Layer 5: 0.999964
7
+ Layer 6: 0.999967
8
+ Layer 7: 1.000033
9
+ Layer 8: 1.000037
10
+ Layer 9: 0.999973
11
+ Layer 10: 0.999964
12
+ Layer 11: 0.999962
13
+ Layer 12: 0.999963
14
+ Layer 13: 1.000026
15
+ Layer 14: 1.000014
16
+ Layer 15: 0.999969
17
+ Layer 16: 0.999997
18
+ Layer 17: 1.000038
19
+ Layer 18: 1.000031
20
+ Layer 19: 0.999985
21
+ Layer 20: 0.999961
22
+ Layer 21: 1.000034
23
+ Layer 22: 0.999964
24
+ Layer 23: 0.999993
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360/test_metrics.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 5.4082
2
+ Test Accuracy: 0.3555
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360/test_metrics_before.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Test Loss: 5.4091
2
+ Test Accuracy: 0.3555
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360_3/config.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epochs: 3
2
+ batch_size: 16
3
+ lr: 5e-06
4
+ seed: 2
5
+ checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-360
6
+ output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360_3
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360_3/final_betas.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffcb2a5601334b7e0f4a5d95e21f0f24ea6c624de1f3287c74b87661b6209c3f
3
+ size 1264