Sync missing vs SOURCE into TARGET under 'checkpoints' (batch 7, +50 files)
Browse files- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3/config.txt +6 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3/final_betas.pt +3 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3/final_betas.txt +24 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3/test_metrics.txt +2 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3/test_metrics_before.txt +2 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr/config.txt +6 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr/final_betas.pt +3 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr/final_betas.txt +24 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr/test_metrics.txt +2 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr/test_metrics_before.txt +2 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_sup/config.txt +6 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_sup/final_betas.pt +3 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_sup/final_betas.txt +24 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_sup/test_metrics_before.txt +2 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72/config.txt +6 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72/final_betas.pt +3 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72/final_betas.txt +24 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72/test_metrics.txt +2 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72/test_metrics_before.txt +2 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1/config.txt +6 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1/final_betas.pt +3 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1/final_betas.txt +24 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1/test_metrics.txt +2 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1/test_metrics_before.txt +2 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360/config.txt +6 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360/final_betas.pt +3 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360/final_betas.txt +24 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360/test_metrics.txt +2 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360/test_metrics_before.txt +2 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3/config.txt +6 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3/final_betas.pt +3 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3/final_betas.txt +24 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3/test_metrics.txt +2 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3/test_metrics_before.txt +2 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_sup/config.txt +6 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_sup/final_betas.pt +3 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_sup/final_betas.txt +24 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_sup/test_metrics_before.txt +2 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2/config.txt +6 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2/final_betas.pt +3 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2/final_betas.txt +24 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2/test_metrics.txt +2 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2/test_metrics_before.txt +2 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360/config.txt +6 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360/final_betas.pt +3 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360/final_betas.txt +24 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360/test_metrics.txt +2 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360/test_metrics_before.txt +2 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360_3/config.txt +6 -0
- checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360_3/final_betas.pt +3 -0
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 16
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 0
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-360
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3/final_betas.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ec8aa784af858b9dbadd298b1a8287e53b83e49c10a8158d483d155df7e05a7
|
| 3 |
+
size 1264
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3/final_betas.txt
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.000146
|
| 2 |
+
Layer 1: 1.000061
|
| 3 |
+
Layer 2: 1.000154
|
| 4 |
+
Layer 3: 1.000082
|
| 5 |
+
Layer 4: 0.999892
|
| 6 |
+
Layer 5: 0.999872
|
| 7 |
+
Layer 6: 0.999877
|
| 8 |
+
Layer 7: 1.000151
|
| 9 |
+
Layer 8: 1.000153
|
| 10 |
+
Layer 9: 0.999899
|
| 11 |
+
Layer 10: 0.999869
|
| 12 |
+
Layer 11: 0.999845
|
| 13 |
+
Layer 12: 0.999841
|
| 14 |
+
Layer 13: 1.000128
|
| 15 |
+
Layer 14: 1.000091
|
| 16 |
+
Layer 15: 0.999871
|
| 17 |
+
Layer 16: 0.999961
|
| 18 |
+
Layer 17: 1.000145
|
| 19 |
+
Layer 18: 1.000103
|
| 20 |
+
Layer 19: 1.000005
|
| 21 |
+
Layer 20: 0.999842
|
| 22 |
+
Layer 21: 1.000116
|
| 23 |
+
Layer 22: 0.999855
|
| 24 |
+
Layer 23: 1.000049
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3/test_metrics.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 5.4055
|
| 2 |
+
Test Accuracy: 0.3555
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_3/test_metrics_before.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 5.4091
|
| 2 |
+
Test Accuracy: 0.3555
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 5
|
| 2 |
+
batch_size: 16
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 0
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-360
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr/final_betas.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:95702e55da289a0b8494bd6e5400d0d1830b7a24c51acd6fd1ae5078d8696491
|
| 3 |
+
size 1264
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr/final_betas.txt
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.000226
|
| 2 |
+
Layer 1: 1.000219
|
| 3 |
+
Layer 2: 1.000252
|
| 4 |
+
Layer 3: 1.000103
|
| 5 |
+
Layer 4: 0.999762
|
| 6 |
+
Layer 5: 0.999922
|
| 7 |
+
Layer 6: 0.999992
|
| 8 |
+
Layer 7: 1.000247
|
| 9 |
+
Layer 8: 1.000198
|
| 10 |
+
Layer 9: 0.999792
|
| 11 |
+
Layer 10: 0.999807
|
| 12 |
+
Layer 11: 0.999734
|
| 13 |
+
Layer 12: 0.999739
|
| 14 |
+
Layer 13: 0.999964
|
| 15 |
+
Layer 14: 1.000038
|
| 16 |
+
Layer 15: 0.999855
|
| 17 |
+
Layer 16: 0.999795
|
| 18 |
+
Layer 17: 1.000256
|
| 19 |
+
Layer 18: 1.000233
|
| 20 |
+
Layer 19: 1.000032
|
| 21 |
+
Layer 20: 0.999748
|
| 22 |
+
Layer 21: 1.000211
|
| 23 |
+
Layer 22: 0.999767
|
| 24 |
+
Layer 23: 1.000104
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr/test_metrics.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 4.0870
|
| 2 |
+
Test Accuracy: 0.4506
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_irr/test_metrics_before.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 4.0911
|
| 2 |
+
Test Accuracy: 0.4506
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_sup/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 16
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 0
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-360
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_sup
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_sup/final_betas.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d35932d084b4582bfdffc12a97b911a9bfe84189f74825648bd86332c6051a0
|
| 3 |
+
size 1264
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_sup/final_betas.txt
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.002702
|
| 2 |
+
Layer 1: 1.002368
|
| 3 |
+
Layer 2: 1.002750
|
| 4 |
+
Layer 3: 1.000241
|
| 5 |
+
Layer 4: 0.997064
|
| 6 |
+
Layer 5: 0.999475
|
| 7 |
+
Layer 6: 0.997436
|
| 8 |
+
Layer 7: 1.000434
|
| 9 |
+
Layer 8: 1.001455
|
| 10 |
+
Layer 9: 0.997719
|
| 11 |
+
Layer 10: 1.000210
|
| 12 |
+
Layer 11: 0.997204
|
| 13 |
+
Layer 12: 0.997816
|
| 14 |
+
Layer 13: 1.000603
|
| 15 |
+
Layer 14: 1.001274
|
| 16 |
+
Layer 15: 0.998692
|
| 17 |
+
Layer 16: 1.001638
|
| 18 |
+
Layer 17: 1.002667
|
| 19 |
+
Layer 18: 0.997705
|
| 20 |
+
Layer 19: 0.999324
|
| 21 |
+
Layer 20: 0.996989
|
| 22 |
+
Layer 21: 0.999316
|
| 23 |
+
Layer 22: 0.997883
|
| 24 |
+
Layer 23: 1.001790
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_360_sup/test_metrics_before.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 3.3787
|
| 2 |
+
Test Accuracy: 0.4416
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 10
|
| 2 |
+
batch_size: 16
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 0
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-72
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72/final_betas.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e12d1ed7b9028807dd713872d39e3798aa6a8badb7631baa025bfc9c7adc3f05
|
| 3 |
+
size 1264
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72/final_betas.txt
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 0.999622
|
| 2 |
+
Layer 1: 1.000431
|
| 3 |
+
Layer 2: 1.001851
|
| 4 |
+
Layer 3: 1.000636
|
| 5 |
+
Layer 4: 1.000028
|
| 6 |
+
Layer 5: 0.999593
|
| 7 |
+
Layer 6: 1.001501
|
| 8 |
+
Layer 7: 1.001937
|
| 9 |
+
Layer 8: 1.000608
|
| 10 |
+
Layer 9: 0.998138
|
| 11 |
+
Layer 10: 0.999010
|
| 12 |
+
Layer 11: 0.998071
|
| 13 |
+
Layer 12: 0.998215
|
| 14 |
+
Layer 13: 1.001478
|
| 15 |
+
Layer 14: 1.001404
|
| 16 |
+
Layer 15: 1.000400
|
| 17 |
+
Layer 16: 0.997987
|
| 18 |
+
Layer 17: 1.001807
|
| 19 |
+
Layer 18: 1.001886
|
| 20 |
+
Layer 19: 1.000023
|
| 21 |
+
Layer 20: 0.997924
|
| 22 |
+
Layer 21: 1.001831
|
| 23 |
+
Layer 22: 0.997960
|
| 24 |
+
Layer 23: 1.001933
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72/test_metrics.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 1.2903
|
| 2 |
+
Test Accuracy: 0.5284
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_0_72/test_metrics_before.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 1.2988
|
| 2 |
+
Test Accuracy: 0.5254
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 16
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 1
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-360
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1/final_betas.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cacc6b34ad88242836c930290b8c88b7eb8e644a422561833f7996fa7a7b0e09
|
| 3 |
+
size 1264
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1/final_betas.txt
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.000347
|
| 2 |
+
Layer 1: 1.000353
|
| 3 |
+
Layer 2: 1.000068
|
| 4 |
+
Layer 3: 1.000365
|
| 5 |
+
Layer 4: 0.999955
|
| 6 |
+
Layer 5: 0.999837
|
| 7 |
+
Layer 6: 0.999764
|
| 8 |
+
Layer 7: 1.000164
|
| 9 |
+
Layer 8: 1.000091
|
| 10 |
+
Layer 9: 0.999845
|
| 11 |
+
Layer 10: 0.999830
|
| 12 |
+
Layer 11: 0.999602
|
| 13 |
+
Layer 12: 0.999656
|
| 14 |
+
Layer 13: 0.999956
|
| 15 |
+
Layer 14: 0.999963
|
| 16 |
+
Layer 15: 0.999686
|
| 17 |
+
Layer 16: 1.000408
|
| 18 |
+
Layer 17: 1.000397
|
| 19 |
+
Layer 18: 0.999666
|
| 20 |
+
Layer 19: 0.999864
|
| 21 |
+
Layer 20: 0.999607
|
| 22 |
+
Layer 21: 0.999888
|
| 23 |
+
Layer 22: 0.999946
|
| 24 |
+
Layer 23: 1.000424
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1/test_metrics.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 5.2827
|
| 2 |
+
Test Accuracy: 0.2901
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1/test_metrics_before.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 5.2859
|
| 2 |
+
Test Accuracy: 0.2891
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 5
|
| 2 |
+
batch_size: 16
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 1
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-360
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360/final_betas.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6f819fe0687f669869f996d2a7232deb7218ad86aeda25975fc357fd3f93b481
|
| 3 |
+
size 1264
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360/final_betas.txt
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.000037
|
| 2 |
+
Layer 1: 1.000029
|
| 3 |
+
Layer 2: 1.000036
|
| 4 |
+
Layer 3: 1.000025
|
| 5 |
+
Layer 4: 0.999968
|
| 6 |
+
Layer 5: 0.999962
|
| 7 |
+
Layer 6: 0.999965
|
| 8 |
+
Layer 7: 1.000034
|
| 9 |
+
Layer 8: 1.000037
|
| 10 |
+
Layer 9: 0.999976
|
| 11 |
+
Layer 10: 0.999965
|
| 12 |
+
Layer 11: 0.999961
|
| 13 |
+
Layer 12: 0.999963
|
| 14 |
+
Layer 13: 1.000014
|
| 15 |
+
Layer 14: 1.000010
|
| 16 |
+
Layer 15: 0.999965
|
| 17 |
+
Layer 16: 0.999995
|
| 18 |
+
Layer 17: 1.000038
|
| 19 |
+
Layer 18: 1.000028
|
| 20 |
+
Layer 19: 1.000015
|
| 21 |
+
Layer 20: 0.999963
|
| 22 |
+
Layer 21: 1.000033
|
| 23 |
+
Layer 22: 0.999964
|
| 24 |
+
Layer 23: 1.000017
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360/test_metrics.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 5.4082
|
| 2 |
+
Test Accuracy: 0.3555
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360/test_metrics_before.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 5.4091
|
| 2 |
+
Test Accuracy: 0.3555
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 16
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 1
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-360
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3/final_betas.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:16e2d18d3d5e4433d05f2aabe9004df7a2f7ba7696057d27f96c9eca7567dc91
|
| 3 |
+
size 1264
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3/final_betas.txt
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.000148
|
| 2 |
+
Layer 1: 1.000062
|
| 3 |
+
Layer 2: 1.000157
|
| 4 |
+
Layer 3: 1.000092
|
| 5 |
+
Layer 4: 0.999862
|
| 6 |
+
Layer 5: 0.999862
|
| 7 |
+
Layer 6: 0.999859
|
| 8 |
+
Layer 7: 1.000152
|
| 9 |
+
Layer 8: 1.000156
|
| 10 |
+
Layer 9: 0.999890
|
| 11 |
+
Layer 10: 0.999887
|
| 12 |
+
Layer 11: 0.999850
|
| 13 |
+
Layer 12: 0.999844
|
| 14 |
+
Layer 13: 1.000109
|
| 15 |
+
Layer 14: 1.000067
|
| 16 |
+
Layer 15: 0.999888
|
| 17 |
+
Layer 16: 0.999977
|
| 18 |
+
Layer 17: 1.000146
|
| 19 |
+
Layer 18: 1.000116
|
| 20 |
+
Layer 19: 1.000003
|
| 21 |
+
Layer 20: 0.999856
|
| 22 |
+
Layer 21: 1.000133
|
| 23 |
+
Layer 22: 0.999858
|
| 24 |
+
Layer 23: 1.000063
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3/test_metrics.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 5.4055
|
| 2 |
+
Test Accuracy: 0.3555
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_3/test_metrics_before.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 5.4091
|
| 2 |
+
Test Accuracy: 0.3555
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_sup/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 16
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 1
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-360
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_sup
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_sup/final_betas.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d587c824c162236d009fc70a41bae4eb65b6359c92a3103432c0f68de63fdf8a
|
| 3 |
+
size 1264
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_sup/final_betas.txt
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.002667
|
| 2 |
+
Layer 1: 1.002316
|
| 3 |
+
Layer 2: 1.002842
|
| 4 |
+
Layer 3: 1.000266
|
| 5 |
+
Layer 4: 0.997047
|
| 6 |
+
Layer 5: 0.999469
|
| 7 |
+
Layer 6: 0.997509
|
| 8 |
+
Layer 7: 1.000430
|
| 9 |
+
Layer 8: 1.001477
|
| 10 |
+
Layer 9: 0.997662
|
| 11 |
+
Layer 10: 1.000166
|
| 12 |
+
Layer 11: 0.997214
|
| 13 |
+
Layer 12: 0.997769
|
| 14 |
+
Layer 13: 1.000648
|
| 15 |
+
Layer 14: 1.001307
|
| 16 |
+
Layer 15: 0.998655
|
| 17 |
+
Layer 16: 1.001639
|
| 18 |
+
Layer 17: 1.002717
|
| 19 |
+
Layer 18: 0.997743
|
| 20 |
+
Layer 19: 0.999275
|
| 21 |
+
Layer 20: 0.997016
|
| 22 |
+
Layer 21: 0.999369
|
| 23 |
+
Layer 22: 0.997829
|
| 24 |
+
Layer 23: 1.001885
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_1_360_sup/test_metrics_before.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 3.3787
|
| 2 |
+
Test Accuracy: 0.4416
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 16
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 2
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-360
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2/final_betas.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8fd2a70386f4d0f80686f1564cb59f99203366a6c6e0226dac8d9bf915c67152
|
| 3 |
+
size 1264
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2/final_betas.txt
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.000291
|
| 2 |
+
Layer 1: 1.000355
|
| 3 |
+
Layer 2: 1.000052
|
| 4 |
+
Layer 3: 1.000314
|
| 5 |
+
Layer 4: 0.999943
|
| 6 |
+
Layer 5: 0.999886
|
| 7 |
+
Layer 6: 0.999795
|
| 8 |
+
Layer 7: 1.000184
|
| 9 |
+
Layer 8: 1.000067
|
| 10 |
+
Layer 9: 0.999857
|
| 11 |
+
Layer 10: 0.999808
|
| 12 |
+
Layer 11: 0.999593
|
| 13 |
+
Layer 12: 0.999660
|
| 14 |
+
Layer 13: 0.999982
|
| 15 |
+
Layer 14: 0.999981
|
| 16 |
+
Layer 15: 0.999664
|
| 17 |
+
Layer 16: 1.000403
|
| 18 |
+
Layer 17: 1.000389
|
| 19 |
+
Layer 18: 0.999671
|
| 20 |
+
Layer 19: 0.999880
|
| 21 |
+
Layer 20: 0.999605
|
| 22 |
+
Layer 21: 0.999844
|
| 23 |
+
Layer 22: 0.999943
|
| 24 |
+
Layer 23: 1.000423
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2/test_metrics.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 5.2828
|
| 2 |
+
Test Accuracy: 0.2901
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2/test_metrics_before.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 5.2859
|
| 2 |
+
Test Accuracy: 0.2891
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 5
|
| 2 |
+
batch_size: 16
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 2
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-360
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360/final_betas.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:34c9a4bd1d6446394b664214d2ad467cf9ef2a84638069c1f598eaefd654be6e
|
| 3 |
+
size 1264
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360/final_betas.txt
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.000035
|
| 2 |
+
Layer 1: 1.000015
|
| 3 |
+
Layer 2: 1.000033
|
| 4 |
+
Layer 3: 1.000008
|
| 5 |
+
Layer 4: 0.999968
|
| 6 |
+
Layer 5: 0.999964
|
| 7 |
+
Layer 6: 0.999967
|
| 8 |
+
Layer 7: 1.000033
|
| 9 |
+
Layer 8: 1.000037
|
| 10 |
+
Layer 9: 0.999973
|
| 11 |
+
Layer 10: 0.999964
|
| 12 |
+
Layer 11: 0.999962
|
| 13 |
+
Layer 12: 0.999963
|
| 14 |
+
Layer 13: 1.000026
|
| 15 |
+
Layer 14: 1.000014
|
| 16 |
+
Layer 15: 0.999969
|
| 17 |
+
Layer 16: 0.999997
|
| 18 |
+
Layer 17: 1.000038
|
| 19 |
+
Layer 18: 1.000031
|
| 20 |
+
Layer 19: 0.999985
|
| 21 |
+
Layer 20: 0.999961
|
| 22 |
+
Layer 21: 1.000034
|
| 23 |
+
Layer 22: 0.999964
|
| 24 |
+
Layer 23: 0.999993
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360/test_metrics.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 5.4082
|
| 2 |
+
Test Accuracy: 0.3555
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360/test_metrics_before.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 5.4091
|
| 2 |
+
Test Accuracy: 0.3555
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360_3/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 16
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 2
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_qwen/checkpoint-360
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360_3
|
checkpoints/residual_beta_clutrr_qwen_test_ood_correct_2_360_3/final_betas.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ffcb2a5601334b7e0f4a5d95e21f0f24ea6c624de1f3287c74b87661b6209c3f
|
| 3 |
+
size 1264
|