Sync missing vs SOURCE into TARGET under 'checkpoints' (batch 5, +50 files)
Browse files- checkpoints/residual_beta_clutrr_gpt2_train_correct_42/final_betas_new.pt +3 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_42/final_betas_new.txt +12 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_42/test_metrics_before_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_42/test_metrics_new.txt +2 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_0/config.txt +6 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_0/final_betas.pt +3 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_0/final_betas.txt +32 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_0/test_metrics.txt +2 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_0/test_metrics_before.txt +2 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_0_360_sup/config.txt +6 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_0_5_sup/config.txt +6 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_1/config.txt +6 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_1/final_betas.pt +3 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_1/final_betas.txt +32 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_1/test_metrics.txt +2 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_1/test_metrics_before.txt +2 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_1_360_sup/config.txt +6 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_1_5_sup/config.txt +6 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_2/config.txt +6 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_2/final_betas.pt +3 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_2/final_betas.txt +32 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_2/test_metrics.txt +2 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_2/test_metrics_before.txt +2 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_2_5_sup/config.txt +6 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_3/config.txt +6 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_3/final_betas.pt +3 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_3/final_betas.txt +32 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_3/test_metrics.txt +2 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_3/test_metrics_before.txt +2 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_42/config.txt +6 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_42/final_betas.pt +3 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_42/final_betas.txt +32 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_42/test_metrics.txt +2 -0
- checkpoints/residual_beta_clutrr_llama_test_ood_correct_42/test_metrics_before.txt +2 -0
- checkpoints/residual_beta_clutrr_llama_train_correct_0/config.txt +6 -0
- checkpoints/residual_beta_clutrr_llama_train_correct_0/final_betas.pt +3 -0
- checkpoints/residual_beta_clutrr_llama_train_correct_0/final_betas.txt +32 -0
- checkpoints/residual_beta_clutrr_llama_train_correct_0/test_metrics.txt +2 -0
- checkpoints/residual_beta_clutrr_llama_train_correct_0/test_metrics_before.txt +2 -0
- checkpoints/residual_beta_clutrr_llama_train_correct_1/config.txt +6 -0
- checkpoints/residual_beta_clutrr_llama_train_correct_1/final_betas.pt +3 -0
- checkpoints/residual_beta_clutrr_llama_train_correct_1/final_betas.txt +32 -0
- checkpoints/residual_beta_clutrr_llama_train_correct_1/test_metrics.txt +2 -0
- checkpoints/residual_beta_clutrr_llama_train_correct_1/test_metrics_before.txt +2 -0
- checkpoints/residual_beta_clutrr_llama_train_correct_2/config.txt +6 -0
- checkpoints/residual_beta_clutrr_llama_train_correct_2/final_betas.pt +3 -0
- checkpoints/residual_beta_clutrr_llama_train_correct_2/final_betas.txt +32 -0
- checkpoints/residual_beta_clutrr_llama_train_correct_2/test_metrics.txt +2 -0
- checkpoints/residual_beta_clutrr_llama_train_correct_2/test_metrics_before.txt +2 -0
- checkpoints/residual_beta_clutrr_llama_train_correct_3/config.txt +6 -0
checkpoints/residual_beta_clutrr_gpt2_train_correct_42/final_betas_new.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a49cd7851544a295dcd0158056c68f37e96c890a72d06bbb575deb36bc6add63
|
| 3 |
+
size 1220
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_42/final_betas_new.txt
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 0.999653
|
| 2 |
+
Layer 1: 1.000033
|
| 3 |
+
Layer 2: 1.000485
|
| 4 |
+
Layer 3: 1.000472
|
| 5 |
+
Layer 4: 1.000640
|
| 6 |
+
Layer 5: 1.000615
|
| 7 |
+
Layer 6: 1.000651
|
| 8 |
+
Layer 7: 0.999653
|
| 9 |
+
Layer 8: 0.999722
|
| 10 |
+
Layer 9: 0.999756
|
| 11 |
+
Layer 10: 0.999356
|
| 12 |
+
Layer 11: 1.000359
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_42/test_metrics_before_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 0.0287
|
| 2 |
+
Test Accuracy: 0.9868
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_42/test_metrics_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 0.0287
|
| 2 |
+
Test Accuracy: 0.9868
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_0/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 4
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 0
|
| 5 |
+
checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_llama_test_ood_correct_0
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_0/final_betas.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c9aa06dfc1284e02e2e7728e6b995c26b83e397fd4d5daee0451f4bfc3d4e29a
|
| 3 |
+
size 1648
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_0/final_betas.txt
ADDED
|
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.000076
|
| 2 |
+
Layer 1: 0.999903
|
| 3 |
+
Layer 2: 1.000117
|
| 4 |
+
Layer 3: 1.000051
|
| 5 |
+
Layer 4: 1.000268
|
| 6 |
+
Layer 5: 0.999983
|
| 7 |
+
Layer 6: 0.999930
|
| 8 |
+
Layer 7: 0.999788
|
| 9 |
+
Layer 8: 0.999786
|
| 10 |
+
Layer 9: 0.999840
|
| 11 |
+
Layer 10: 1.000265
|
| 12 |
+
Layer 11: 0.999614
|
| 13 |
+
Layer 12: 0.999760
|
| 14 |
+
Layer 13: 0.999672
|
| 15 |
+
Layer 14: 1.000397
|
| 16 |
+
Layer 15: 1.000151
|
| 17 |
+
Layer 16: 0.999691
|
| 18 |
+
Layer 17: 0.999929
|
| 19 |
+
Layer 18: 1.000166
|
| 20 |
+
Layer 19: 0.999558
|
| 21 |
+
Layer 20: 1.000380
|
| 22 |
+
Layer 21: 1.000044
|
| 23 |
+
Layer 22: 0.999544
|
| 24 |
+
Layer 23: 1.000252
|
| 25 |
+
Layer 24: 1.000250
|
| 26 |
+
Layer 25: 0.999792
|
| 27 |
+
Layer 26: 1.000169
|
| 28 |
+
Layer 27: 0.999551
|
| 29 |
+
Layer 28: 1.000153
|
| 30 |
+
Layer 29: 1.000162
|
| 31 |
+
Layer 30: 1.000268
|
| 32 |
+
Layer 31: 1.000337
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_0/test_metrics.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 2.1291
|
| 2 |
+
Test Accuracy: 0.6358
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_0/test_metrics_before.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 2.1332
|
| 2 |
+
Test Accuracy: 0.6358
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_0_360_sup/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 4
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 0
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_llama/checkpoint-360
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_llama_test_ood_correct_0_360_sup
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_0_5_sup/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 4
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 0
|
| 5 |
+
checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_llama_test_ood_correct_0_5_sup
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_1/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 4
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 1
|
| 5 |
+
checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_llama_test_ood_correct_1
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_1/final_betas.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b45f03c6fb18352fe0f2a676974d31d079e74a074eb451d7b48633112093c782
|
| 3 |
+
size 1648
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_1/final_betas.txt
ADDED
|
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.000057
|
| 2 |
+
Layer 1: 0.999892
|
| 3 |
+
Layer 2: 1.000131
|
| 4 |
+
Layer 3: 1.000091
|
| 5 |
+
Layer 4: 1.000279
|
| 6 |
+
Layer 5: 0.999976
|
| 7 |
+
Layer 6: 0.999942
|
| 8 |
+
Layer 7: 0.999838
|
| 9 |
+
Layer 8: 0.999756
|
| 10 |
+
Layer 9: 0.999839
|
| 11 |
+
Layer 10: 1.000284
|
| 12 |
+
Layer 11: 0.999585
|
| 13 |
+
Layer 12: 0.999785
|
| 14 |
+
Layer 13: 0.999654
|
| 15 |
+
Layer 14: 1.000371
|
| 16 |
+
Layer 15: 1.000184
|
| 17 |
+
Layer 16: 0.999707
|
| 18 |
+
Layer 17: 0.999920
|
| 19 |
+
Layer 18: 1.000166
|
| 20 |
+
Layer 19: 0.999567
|
| 21 |
+
Layer 20: 1.000366
|
| 22 |
+
Layer 21: 1.000078
|
| 23 |
+
Layer 22: 0.999533
|
| 24 |
+
Layer 23: 1.000281
|
| 25 |
+
Layer 24: 1.000284
|
| 26 |
+
Layer 25: 0.999787
|
| 27 |
+
Layer 26: 1.000183
|
| 28 |
+
Layer 27: 0.999543
|
| 29 |
+
Layer 28: 1.000109
|
| 30 |
+
Layer 29: 1.000183
|
| 31 |
+
Layer 30: 1.000251
|
| 32 |
+
Layer 31: 1.000286
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_1/test_metrics.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 2.1291
|
| 2 |
+
Test Accuracy: 0.6358
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_1/test_metrics_before.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 2.1332
|
| 2 |
+
Test Accuracy: 0.6358
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_1_360_sup/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 4
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 1
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_llama/checkpoint-360
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_llama_test_ood_correct_1_360_sup
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_1_5_sup/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 4
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 1
|
| 5 |
+
checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_llama_test_ood_correct_1_5_sup
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_2/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 4
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 2
|
| 5 |
+
checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_llama_test_ood_correct_2
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_2/final_betas.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:38be78b41c49822a2ea338a85880daf6dbffff3cf4c2e625fa38b98c0562cff2
|
| 3 |
+
size 1648
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_2/final_betas.txt
ADDED
|
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.000049
|
| 2 |
+
Layer 1: 0.999899
|
| 3 |
+
Layer 2: 1.000125
|
| 4 |
+
Layer 3: 1.000065
|
| 5 |
+
Layer 4: 1.000246
|
| 6 |
+
Layer 5: 1.000024
|
| 7 |
+
Layer 6: 0.999946
|
| 8 |
+
Layer 7: 0.999762
|
| 9 |
+
Layer 8: 0.999763
|
| 10 |
+
Layer 9: 0.999902
|
| 11 |
+
Layer 10: 1.000269
|
| 12 |
+
Layer 11: 0.999593
|
| 13 |
+
Layer 12: 0.999716
|
| 14 |
+
Layer 13: 0.999663
|
| 15 |
+
Layer 14: 1.000386
|
| 16 |
+
Layer 15: 1.000159
|
| 17 |
+
Layer 16: 0.999684
|
| 18 |
+
Layer 17: 0.999871
|
| 19 |
+
Layer 18: 1.000162
|
| 20 |
+
Layer 19: 0.999569
|
| 21 |
+
Layer 20: 1.000359
|
| 22 |
+
Layer 21: 1.000065
|
| 23 |
+
Layer 22: 0.999560
|
| 24 |
+
Layer 23: 1.000259
|
| 25 |
+
Layer 24: 1.000261
|
| 26 |
+
Layer 25: 0.999805
|
| 27 |
+
Layer 26: 1.000163
|
| 28 |
+
Layer 27: 0.999591
|
| 29 |
+
Layer 28: 1.000092
|
| 30 |
+
Layer 29: 1.000202
|
| 31 |
+
Layer 30: 1.000239
|
| 32 |
+
Layer 31: 1.000287
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_2/test_metrics.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 2.1292
|
| 2 |
+
Test Accuracy: 0.6358
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_2/test_metrics_before.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 2.1332
|
| 2 |
+
Test Accuracy: 0.6358
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_2_5_sup/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 4
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 2
|
| 5 |
+
checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_llama_test_ood_correct_2_5_sup
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_3/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 4
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 3
|
| 5 |
+
checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_llama_test_ood_correct_3
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_3/final_betas.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:37025576941bfc28183a87a9f943e3f91d68211ea9bb8632f0bbc5f1423a961e
|
| 3 |
+
size 1648
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_3/final_betas.txt
ADDED
|
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.000044
|
| 2 |
+
Layer 1: 0.999919
|
| 3 |
+
Layer 2: 1.000139
|
| 4 |
+
Layer 3: 1.000065
|
| 5 |
+
Layer 4: 1.000301
|
| 6 |
+
Layer 5: 1.000002
|
| 7 |
+
Layer 6: 0.999924
|
| 8 |
+
Layer 7: 0.999817
|
| 9 |
+
Layer 8: 0.999759
|
| 10 |
+
Layer 9: 0.999882
|
| 11 |
+
Layer 10: 1.000232
|
| 12 |
+
Layer 11: 0.999656
|
| 13 |
+
Layer 12: 0.999739
|
| 14 |
+
Layer 13: 0.999704
|
| 15 |
+
Layer 14: 1.000372
|
| 16 |
+
Layer 15: 1.000132
|
| 17 |
+
Layer 16: 0.999701
|
| 18 |
+
Layer 17: 0.999889
|
| 19 |
+
Layer 18: 1.000138
|
| 20 |
+
Layer 19: 0.999565
|
| 21 |
+
Layer 20: 1.000427
|
| 22 |
+
Layer 21: 1.000082
|
| 23 |
+
Layer 22: 0.999549
|
| 24 |
+
Layer 23: 1.000314
|
| 25 |
+
Layer 24: 1.000259
|
| 26 |
+
Layer 25: 0.999759
|
| 27 |
+
Layer 26: 1.000139
|
| 28 |
+
Layer 27: 0.999559
|
| 29 |
+
Layer 28: 1.000105
|
| 30 |
+
Layer 29: 1.000153
|
| 31 |
+
Layer 30: 1.000232
|
| 32 |
+
Layer 31: 1.000292
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_3/test_metrics.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 2.1292
|
| 2 |
+
Test Accuracy: 0.6358
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_3/test_metrics_before.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 2.1332
|
| 2 |
+
Test Accuracy: 0.6358
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_42/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 4
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 42
|
| 5 |
+
checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_llama_test_ood_correct_42
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_42/final_betas.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6847fcceea2ef09b014f6cdec124a5da538353a4bf654bf1a74f1848fd0fd98a
|
| 3 |
+
size 1648
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_42/final_betas.txt
ADDED
|
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.000038
|
| 2 |
+
Layer 1: 0.999942
|
| 3 |
+
Layer 2: 1.000114
|
| 4 |
+
Layer 3: 1.000136
|
| 5 |
+
Layer 4: 1.000243
|
| 6 |
+
Layer 5: 1.000004
|
| 7 |
+
Layer 6: 0.999921
|
| 8 |
+
Layer 7: 0.999820
|
| 9 |
+
Layer 8: 0.999825
|
| 10 |
+
Layer 9: 0.999864
|
| 11 |
+
Layer 10: 1.000246
|
| 12 |
+
Layer 11: 0.999663
|
| 13 |
+
Layer 12: 0.999800
|
| 14 |
+
Layer 13: 0.999628
|
| 15 |
+
Layer 14: 1.000331
|
| 16 |
+
Layer 15: 1.000161
|
| 17 |
+
Layer 16: 0.999700
|
| 18 |
+
Layer 17: 0.999922
|
| 19 |
+
Layer 18: 1.000136
|
| 20 |
+
Layer 19: 0.999544
|
| 21 |
+
Layer 20: 1.000375
|
| 22 |
+
Layer 21: 1.000083
|
| 23 |
+
Layer 22: 0.999531
|
| 24 |
+
Layer 23: 1.000296
|
| 25 |
+
Layer 24: 1.000268
|
| 26 |
+
Layer 25: 0.999740
|
| 27 |
+
Layer 26: 1.000129
|
| 28 |
+
Layer 27: 0.999552
|
| 29 |
+
Layer 28: 1.000087
|
| 30 |
+
Layer 29: 1.000152
|
| 31 |
+
Layer 30: 1.000218
|
| 32 |
+
Layer 31: 1.000292
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_42/test_metrics.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 2.1293
|
| 2 |
+
Test Accuracy: 0.6358
|
checkpoints/residual_beta_clutrr_llama_test_ood_correct_42/test_metrics_before.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 2.1332
|
| 2 |
+
Test Accuracy: 0.6358
|
checkpoints/residual_beta_clutrr_llama_train_correct_0/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 4
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 0
|
| 5 |
+
checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_llama_train_correct_0
|
checkpoints/residual_beta_clutrr_llama_train_correct_0/final_betas.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d4fd60511989382bad3dd2d079448b464c20e588f75ee0bb90add31794121aa9
|
| 3 |
+
size 1648
|
checkpoints/residual_beta_clutrr_llama_train_correct_0/final_betas.txt
ADDED
|
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.001698
|
| 2 |
+
Layer 1: 0.997893
|
| 3 |
+
Layer 2: 1.001930
|
| 4 |
+
Layer 3: 0.998901
|
| 5 |
+
Layer 4: 0.998956
|
| 6 |
+
Layer 5: 0.999694
|
| 7 |
+
Layer 6: 1.000498
|
| 8 |
+
Layer 7: 0.999588
|
| 9 |
+
Layer 8: 1.000236
|
| 10 |
+
Layer 9: 1.002018
|
| 11 |
+
Layer 10: 1.000320
|
| 12 |
+
Layer 11: 0.998410
|
| 13 |
+
Layer 12: 1.000116
|
| 14 |
+
Layer 13: 1.002069
|
| 15 |
+
Layer 14: 0.997052
|
| 16 |
+
Layer 15: 0.999062
|
| 17 |
+
Layer 16: 0.998260
|
| 18 |
+
Layer 17: 1.000410
|
| 19 |
+
Layer 18: 0.998667
|
| 20 |
+
Layer 19: 0.999585
|
| 21 |
+
Layer 20: 1.001028
|
| 22 |
+
Layer 21: 1.001209
|
| 23 |
+
Layer 22: 0.997678
|
| 24 |
+
Layer 23: 0.996642
|
| 25 |
+
Layer 24: 1.002759
|
| 26 |
+
Layer 25: 0.996454
|
| 27 |
+
Layer 26: 0.999449
|
| 28 |
+
Layer 27: 0.997274
|
| 29 |
+
Layer 28: 0.997749
|
| 30 |
+
Layer 29: 0.999731
|
| 31 |
+
Layer 30: 0.997755
|
| 32 |
+
Layer 31: 1.003472
|
checkpoints/residual_beta_clutrr_llama_train_correct_0/test_metrics.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 0.0226
|
| 2 |
+
Test Accuracy: 0.9942
|
checkpoints/residual_beta_clutrr_llama_train_correct_0/test_metrics_before.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 0.0236
|
| 2 |
+
Test Accuracy: 0.9940
|
checkpoints/residual_beta_clutrr_llama_train_correct_1/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 4
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 1
|
| 5 |
+
checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_llama_train_correct_1
|
checkpoints/residual_beta_clutrr_llama_train_correct_1/final_betas.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c8689cc6cca13b75bd3cf6de8ae694e0750ae2a7cc766a1599e9aeaf52144c9f
|
| 3 |
+
size 1648
|
checkpoints/residual_beta_clutrr_llama_train_correct_1/final_betas.txt
ADDED
|
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.001549
|
| 2 |
+
Layer 1: 0.997922
|
| 3 |
+
Layer 2: 1.001824
|
| 4 |
+
Layer 3: 0.998915
|
| 5 |
+
Layer 4: 0.998898
|
| 6 |
+
Layer 5: 0.999670
|
| 7 |
+
Layer 6: 1.000539
|
| 8 |
+
Layer 7: 0.999587
|
| 9 |
+
Layer 8: 1.000297
|
| 10 |
+
Layer 9: 1.002017
|
| 11 |
+
Layer 10: 1.000371
|
| 12 |
+
Layer 11: 0.998439
|
| 13 |
+
Layer 12: 1.000070
|
| 14 |
+
Layer 13: 1.002052
|
| 15 |
+
Layer 14: 0.997161
|
| 16 |
+
Layer 15: 0.999056
|
| 17 |
+
Layer 16: 0.998278
|
| 18 |
+
Layer 17: 1.000382
|
| 19 |
+
Layer 18: 0.998720
|
| 20 |
+
Layer 19: 0.999580
|
| 21 |
+
Layer 20: 1.001064
|
| 22 |
+
Layer 21: 1.001211
|
| 23 |
+
Layer 22: 0.997648
|
| 24 |
+
Layer 23: 0.996551
|
| 25 |
+
Layer 24: 1.002808
|
| 26 |
+
Layer 25: 0.996599
|
| 27 |
+
Layer 26: 0.999425
|
| 28 |
+
Layer 27: 0.997328
|
| 29 |
+
Layer 28: 0.997917
|
| 30 |
+
Layer 29: 0.999739
|
| 31 |
+
Layer 30: 0.997880
|
| 32 |
+
Layer 31: 1.003539
|
checkpoints/residual_beta_clutrr_llama_train_correct_1/test_metrics.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 0.0227
|
| 2 |
+
Test Accuracy: 0.9942
|
checkpoints/residual_beta_clutrr_llama_train_correct_1/test_metrics_before.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 0.0236
|
| 2 |
+
Test Accuracy: 0.9940
|
checkpoints/residual_beta_clutrr_llama_train_correct_2/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 4
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 2
|
| 5 |
+
checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_llama_train_correct_2
|
checkpoints/residual_beta_clutrr_llama_train_correct_2/final_betas.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5f5201d946ab22599688df17dff73fd79a6fd3f457887d7c94107bdd88a3be9f
|
| 3 |
+
size 1648
|
checkpoints/residual_beta_clutrr_llama_train_correct_2/final_betas.txt
ADDED
|
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.001709
|
| 2 |
+
Layer 1: 0.997907
|
| 3 |
+
Layer 2: 1.001903
|
| 4 |
+
Layer 3: 0.998951
|
| 5 |
+
Layer 4: 0.998942
|
| 6 |
+
Layer 5: 0.999700
|
| 7 |
+
Layer 6: 1.000541
|
| 8 |
+
Layer 7: 0.999545
|
| 9 |
+
Layer 8: 1.000248
|
| 10 |
+
Layer 9: 1.002025
|
| 11 |
+
Layer 10: 1.000368
|
| 12 |
+
Layer 11: 0.998406
|
| 13 |
+
Layer 12: 0.999990
|
| 14 |
+
Layer 13: 1.002042
|
| 15 |
+
Layer 14: 0.997180
|
| 16 |
+
Layer 15: 0.999018
|
| 17 |
+
Layer 16: 0.998291
|
| 18 |
+
Layer 17: 1.000450
|
| 19 |
+
Layer 18: 0.998765
|
| 20 |
+
Layer 19: 0.999521
|
| 21 |
+
Layer 20: 1.000991
|
| 22 |
+
Layer 21: 1.001229
|
| 23 |
+
Layer 22: 0.997614
|
| 24 |
+
Layer 23: 0.996626
|
| 25 |
+
Layer 24: 1.002810
|
| 26 |
+
Layer 25: 0.996541
|
| 27 |
+
Layer 26: 0.999404
|
| 28 |
+
Layer 27: 0.997411
|
| 29 |
+
Layer 28: 0.997892
|
| 30 |
+
Layer 29: 0.999704
|
| 31 |
+
Layer 30: 0.997883
|
| 32 |
+
Layer 31: 1.003333
|
checkpoints/residual_beta_clutrr_llama_train_correct_2/test_metrics.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 0.0226
|
| 2 |
+
Test Accuracy: 0.9942
|
checkpoints/residual_beta_clutrr_llama_train_correct_2/test_metrics_before.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 0.0236
|
| 2 |
+
Test Accuracy: 0.9940
|
checkpoints/residual_beta_clutrr_llama_train_correct_3/config.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 3
|
| 2 |
+
batch_size: 4
|
| 3 |
+
lr: 5e-06
|
| 4 |
+
seed: 3
|
| 5 |
+
checkpoint_dir: checkpoints/checkpoints/clutrr_llama3_8b/checkpoint_epoch_5
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_llama_train_correct_3
|