Sync missing vs SOURCE into TARGET under 'checkpoints' (batch 4, +50 files)
Browse files- checkpoints/residual_beta_clutrr_gpt2_test_ood_checkingcode/final_betas_new.pt +3 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_checkingcode/final_betas_new.txt +12 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_checkingcode/test_metrics_before_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_checkingcode/test_metrics_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_0/config_new.txt +6 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_0/final_betas_new.pt +3 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_0/final_betas_new.txt +12 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_0/test_metrics_before_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_0/test_metrics_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_1/config_new.txt +6 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_1/final_betas_new.pt +3 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_1/final_betas_new.txt +12 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_1/test_metrics_before_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_1/test_metrics_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_2/config_new.txt +6 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_2/final_betas_new.pt +3 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_2/final_betas_new.txt +12 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_2/test_metrics_before_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_2/test_metrics_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_3/config_new.txt +6 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_3/final_betas_new.pt +3 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_3/final_betas_new.txt +12 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_3/test_metrics_before_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_3/test_metrics_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_42/config_new.txt +6 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_42/final_betas_new.pt +3 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_42/final_betas_new.txt +12 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_42/test_metrics_before_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_42/test_metrics_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_0/config_new.txt +6 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_0/final_betas_new.pt +3 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_0/final_betas_new.txt +12 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_0/test_metrics_before_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_0/test_metrics_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_1/config_new.txt +6 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_1/final_betas_new.pt +3 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_1/final_betas_new.txt +12 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_1/test_metrics_before_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_1/test_metrics_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_2/config_new.txt +6 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_2/final_betas_new.pt +3 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_2/final_betas_new.txt +12 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_2/test_metrics_before_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_2/test_metrics_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_3/config_new.txt +6 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_3/final_betas_new.pt +3 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_3/final_betas_new.txt +12 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_3/test_metrics_before_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_3/test_metrics_new.txt +2 -0
- checkpoints/residual_beta_clutrr_gpt2_train_correct_42/config_new.txt +6 -0
checkpoints/residual_beta_clutrr_gpt2_test_ood_checkingcode/final_betas_new.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:762079830b8a54ff716ec90426cf189e1ad1fe4597228568452c639f9b96cf0e
|
| 3 |
+
size 1220
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_checkingcode/final_betas_new.txt
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.000489
|
| 2 |
+
Layer 1: 1.000476
|
| 3 |
+
Layer 2: 1.000012
|
| 4 |
+
Layer 3: 1.000001
|
| 5 |
+
Layer 4: 0.999990
|
| 6 |
+
Layer 5: 0.999674
|
| 7 |
+
Layer 6: 1.000200
|
| 8 |
+
Layer 7: 1.000267
|
| 9 |
+
Layer 8: 1.000156
|
| 10 |
+
Layer 9: 0.999520
|
| 11 |
+
Layer 10: 0.999556
|
| 12 |
+
Layer 11: 0.999477
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_checkingcode/test_metrics_before_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 6.9655
|
| 2 |
+
Test Accuracy: 0.2124
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_checkingcode/test_metrics_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 6.9636
|
| 2 |
+
Test Accuracy: 0.2124
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_0/config_new.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 5
|
| 2 |
+
batch_size: 32
|
| 3 |
+
lr: 5e-05
|
| 4 |
+
seed: 0
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_gpt2/checkpoint-720
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_0
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_0/final_betas_new.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3d5bcb932e4d015134485bf8549af767cfae282715e6e97d95b264d6d40efebe
|
| 3 |
+
size 1220
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_0/final_betas_new.txt
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.000508
|
| 2 |
+
Layer 1: 1.000363
|
| 3 |
+
Layer 2: 1.000153
|
| 4 |
+
Layer 3: 1.000277
|
| 5 |
+
Layer 4: 1.000370
|
| 6 |
+
Layer 5: 0.999774
|
| 7 |
+
Layer 6: 0.999505
|
| 8 |
+
Layer 7: 0.999486
|
| 9 |
+
Layer 8: 0.999477
|
| 10 |
+
Layer 9: 0.999512
|
| 11 |
+
Layer 10: 0.999538
|
| 12 |
+
Layer 11: 0.999611
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_0/test_metrics_before_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 6.9655
|
| 2 |
+
Test Accuracy: 0.2124
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_0/test_metrics_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 6.9612
|
| 2 |
+
Test Accuracy: 0.2124
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_1/config_new.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 5
|
| 2 |
+
batch_size: 32
|
| 3 |
+
lr: 5e-05
|
| 4 |
+
seed: 1
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_gpt2/checkpoint-720
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_1
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_1/final_betas_new.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c6ec58135c104007fc14308385098aed075a58cd7140e9a7df046bc1a4daf1cb
|
| 3 |
+
size 1220
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_1/final_betas_new.txt
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.000494
|
| 2 |
+
Layer 1: 1.000410
|
| 3 |
+
Layer 2: 0.999985
|
| 4 |
+
Layer 3: 0.999895
|
| 5 |
+
Layer 4: 1.000292
|
| 6 |
+
Layer 5: 0.999776
|
| 7 |
+
Layer 6: 0.999503
|
| 8 |
+
Layer 7: 0.999499
|
| 9 |
+
Layer 8: 0.999488
|
| 10 |
+
Layer 9: 0.999519
|
| 11 |
+
Layer 10: 0.999594
|
| 12 |
+
Layer 11: 0.999579
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_1/test_metrics_before_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 6.9655
|
| 2 |
+
Test Accuracy: 0.2124
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_1/test_metrics_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 6.9613
|
| 2 |
+
Test Accuracy: 0.2124
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_2/config_new.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 5
|
| 2 |
+
batch_size: 32
|
| 3 |
+
lr: 5e-05
|
| 4 |
+
seed: 2
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_gpt2/checkpoint-720
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_2
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_2/final_betas_new.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:899f44739505920bf78e4f18d76338da1fd22b0717e4fe6d6f9efa80cde6b560
|
| 3 |
+
size 1220
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_2/final_betas_new.txt
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.000485
|
| 2 |
+
Layer 1: 1.000385
|
| 3 |
+
Layer 2: 1.000144
|
| 4 |
+
Layer 3: 0.999785
|
| 5 |
+
Layer 4: 1.000276
|
| 6 |
+
Layer 5: 1.000005
|
| 7 |
+
Layer 6: 0.999636
|
| 8 |
+
Layer 7: 0.999571
|
| 9 |
+
Layer 8: 0.999487
|
| 10 |
+
Layer 9: 0.999516
|
| 11 |
+
Layer 10: 0.999569
|
| 12 |
+
Layer 11: 0.999777
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_2/test_metrics_before_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 6.9655
|
| 2 |
+
Test Accuracy: 0.2124
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_2/test_metrics_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 6.9616
|
| 2 |
+
Test Accuracy: 0.2124
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_3/config_new.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 5
|
| 2 |
+
batch_size: 32
|
| 3 |
+
lr: 5e-05
|
| 4 |
+
seed: 3
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_gpt2/checkpoint-720
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_3
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_3/final_betas_new.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ea715191ec203f98d50f0abbf7062ea2ca140c1f11a1c55b6b92bc2e5a9a1fcc
|
| 3 |
+
size 1220
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_3/final_betas_new.txt
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.000511
|
| 2 |
+
Layer 1: 1.000356
|
| 3 |
+
Layer 2: 1.000039
|
| 4 |
+
Layer 3: 0.999923
|
| 5 |
+
Layer 4: 1.000333
|
| 6 |
+
Layer 5: 0.999933
|
| 7 |
+
Layer 6: 0.999501
|
| 8 |
+
Layer 7: 0.999537
|
| 9 |
+
Layer 8: 0.999474
|
| 10 |
+
Layer 9: 0.999535
|
| 11 |
+
Layer 10: 0.999688
|
| 12 |
+
Layer 11: 0.999647
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_3/test_metrics_before_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 6.9655
|
| 2 |
+
Test Accuracy: 0.2124
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_3/test_metrics_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 6.9614
|
| 2 |
+
Test Accuracy: 0.2124
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_42/config_new.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 5
|
| 2 |
+
batch_size: 32
|
| 3 |
+
lr: 5e-05
|
| 4 |
+
seed: 42
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_gpt2/checkpoint-720
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_42
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_42/final_betas_new.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:253e2eb48ea33f76082c01d2936dc37f8c859f8330e2d34e4bcf3e63d9c558f2
|
| 3 |
+
size 1220
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_42/final_betas_new.txt
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 1.000500
|
| 2 |
+
Layer 1: 1.000426
|
| 3 |
+
Layer 2: 0.999948
|
| 4 |
+
Layer 3: 1.000143
|
| 5 |
+
Layer 4: 1.000222
|
| 6 |
+
Layer 5: 1.000103
|
| 7 |
+
Layer 6: 0.999491
|
| 8 |
+
Layer 7: 0.999485
|
| 9 |
+
Layer 8: 0.999483
|
| 10 |
+
Layer 9: 0.999544
|
| 11 |
+
Layer 10: 0.999709
|
| 12 |
+
Layer 11: 0.999537
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_42/test_metrics_before_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 6.9655
|
| 2 |
+
Test Accuracy: 0.2124
|
checkpoints/residual_beta_clutrr_gpt2_test_ood_correct_42/test_metrics_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 6.9615
|
| 2 |
+
Test Accuracy: 0.2124
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_0/config_new.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 5
|
| 2 |
+
batch_size: 32
|
| 3 |
+
lr: 5e-05
|
| 4 |
+
seed: 0
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_gpt2/checkpoint-720
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_gpt2_train_correct_0
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_0/final_betas_new.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:774bf2a83aab35a5783b5647cc6be35c65f69a42af1d9334b1c30fc59047eabe
|
| 3 |
+
size 1220
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_0/final_betas_new.txt
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 0.999636
|
| 2 |
+
Layer 1: 0.999896
|
| 3 |
+
Layer 2: 0.999829
|
| 4 |
+
Layer 3: 0.998708
|
| 5 |
+
Layer 4: 1.000324
|
| 6 |
+
Layer 5: 1.000809
|
| 7 |
+
Layer 6: 0.999786
|
| 8 |
+
Layer 7: 0.999835
|
| 9 |
+
Layer 8: 1.000335
|
| 10 |
+
Layer 9: 1.000188
|
| 11 |
+
Layer 10: 0.999609
|
| 12 |
+
Layer 11: 1.001174
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_0/test_metrics_before_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 0.0287
|
| 2 |
+
Test Accuracy: 0.9868
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_0/test_metrics_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 0.0287
|
| 2 |
+
Test Accuracy: 0.9868
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_1/config_new.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 5
|
| 2 |
+
batch_size: 32
|
| 3 |
+
lr: 5e-05
|
| 4 |
+
seed: 1
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_gpt2/checkpoint-720
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_gpt2_train_correct_1
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_1/final_betas_new.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a65a10c94cc840d488b2e787f8ddad866df7fa5fcde425de24f64c5be261424a
|
| 3 |
+
size 1220
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_1/final_betas_new.txt
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 0.998699
|
| 2 |
+
Layer 1: 1.000081
|
| 3 |
+
Layer 2: 0.999607
|
| 4 |
+
Layer 3: 1.000792
|
| 5 |
+
Layer 4: 1.001033
|
| 6 |
+
Layer 5: 1.001055
|
| 7 |
+
Layer 6: 1.000667
|
| 8 |
+
Layer 7: 0.999984
|
| 9 |
+
Layer 8: 0.999738
|
| 10 |
+
Layer 9: 0.999291
|
| 11 |
+
Layer 10: 1.001172
|
| 12 |
+
Layer 11: 1.000791
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_1/test_metrics_before_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 0.0287
|
| 2 |
+
Test Accuracy: 0.9868
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_1/test_metrics_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 0.0287
|
| 2 |
+
Test Accuracy: 0.9868
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_2/config_new.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 5
|
| 2 |
+
batch_size: 32
|
| 3 |
+
lr: 5e-05
|
| 4 |
+
seed: 2
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_gpt2/checkpoint-720
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_gpt2_train_correct_2
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_2/final_betas_new.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba7d437f0450ad2b918d232016c16ba95d38c7f38c7096bfc3f3196ff390f642
|
| 3 |
+
size 1220
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_2/final_betas_new.txt
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 0.999878
|
| 2 |
+
Layer 1: 0.999095
|
| 3 |
+
Layer 2: 1.000362
|
| 4 |
+
Layer 3: 0.999807
|
| 5 |
+
Layer 4: 1.000084
|
| 6 |
+
Layer 5: 1.000041
|
| 7 |
+
Layer 6: 1.000339
|
| 8 |
+
Layer 7: 0.999619
|
| 9 |
+
Layer 8: 0.999739
|
| 10 |
+
Layer 9: 0.999950
|
| 11 |
+
Layer 10: 0.999249
|
| 12 |
+
Layer 11: 1.000993
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_2/test_metrics_before_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 0.0287
|
| 2 |
+
Test Accuracy: 0.9868
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_2/test_metrics_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 0.0287
|
| 2 |
+
Test Accuracy: 0.9868
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_3/config_new.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 5
|
| 2 |
+
batch_size: 32
|
| 3 |
+
lr: 5e-05
|
| 4 |
+
seed: 3
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_gpt2/checkpoint-720
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_gpt2_train_correct_3
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_3/final_betas_new.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8bc57c1040dfe34c650b53c540876b4f37dff4c71ab87a5a7dc163b3644f0fbc
|
| 3 |
+
size 1220
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_3/final_betas_new.txt
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Layer 0: 0.998813
|
| 2 |
+
Layer 1: 0.999242
|
| 3 |
+
Layer 2: 0.999722
|
| 4 |
+
Layer 3: 0.999500
|
| 5 |
+
Layer 4: 1.000859
|
| 6 |
+
Layer 5: 1.001143
|
| 7 |
+
Layer 6: 1.000974
|
| 8 |
+
Layer 7: 1.000347
|
| 9 |
+
Layer 8: 0.999898
|
| 10 |
+
Layer 9: 0.999706
|
| 11 |
+
Layer 10: 0.999855
|
| 12 |
+
Layer 11: 1.000684
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_3/test_metrics_before_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 0.0287
|
| 2 |
+
Test Accuracy: 0.9868
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_3/test_metrics_new.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Test Loss: 0.0287
|
| 2 |
+
Test Accuracy: 0.9868
|
checkpoints/residual_beta_clutrr_gpt2_train_correct_42/config_new.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epochs: 5
|
| 2 |
+
batch_size: 32
|
| 3 |
+
lr: 5e-05
|
| 4 |
+
seed: 42
|
| 5 |
+
checkpoint_dir: checkpoints/clutrr_gpt2/checkpoint-720
|
| 6 |
+
output_dir: checkpoints/residual_beta_clutrr_gpt2_train_correct_42
|