Add files using upload-large-folder tool
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/bias_shift/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500015.gamma.1536692.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/bias_shift/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737499999.gamma.1536345.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500006.gamma.1536464.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500012.gamma.1536578.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500233.gamma.1538502.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500241.gamma.1538698.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500247.gamma.1538878.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=3/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500725.gamma.1543513.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=3/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/bias_shift/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737549564.gamma.1638424.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/bias_shift/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737549528.gamma.1638002.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737549538.gamma.1638140.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737549544.gamma.1638289.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=1/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=1/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/bias_shift/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550451.gamma.1644992.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/bias_shift/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550413.gamma.1644570.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550422.gamma.1644707.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550428.gamma.1644828.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/bias_shift/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550884.gamma.1647198.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/bias_shift/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550865.gamma.1646832.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550874.gamma.1646964.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550881.gamma.1647081.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/bias_shift/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737551331.gamma.1648831.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/bias_shift/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737551298.gamma.1648450.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737551307.gamma.1648582.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737551313.gamma.1648699.0 +3 -0
- calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
- finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/config.json +39 -0
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/bias_shift/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500015.gamma.1536692.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:659a539e737edaa2aeafe8b62470c1c9bcd9e0e78042af4073f7f615fc5b96eb
|
| 3 |
+
size 309890
|
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/bias_shift/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8c6d642ac60ca833f3726db86f282ffa67f68b2d02d5bf7b2f770048968e2080
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737499999.gamma.1536345.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:af6b00d4c96c18d5da99f19b94a9954ddfee8d5631428ae19941e7ebd3c6e042
|
| 3 |
+
size 350866
|
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:81f2f35c4d2ec89c4e4e78c4eff3d39ba3c6072daf800760c5beb6cb82705314
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500006.gamma.1536464.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c13b8870204a67e5697d98d77b54088196a0718905ff8427189e886024dd4da5
|
| 3 |
+
size 209386
|
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aa527e8c8110319ff9b435664983945d6744e97e178df0c26a1955f40269a75a
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500012.gamma.1536578.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1bcdeb98534784d8cdf7528d3be1f8d3d82d1a2451ec378b23b63a33343ce54f
|
| 3 |
+
size 58802
|
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:32dc8f282ed7accd041e25c0583ac3b7838df0c94b3e9259ef6a33c756e5d3b9
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500233.gamma.1538502.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a0e7cd3e4f8b25d82fc3b1a68d21020840fa34b0eac1f032c7b9827dd2015189
|
| 3 |
+
size 371082
|
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:db27831e7a9a4f9f69db5597d197402f3b43169c2e994c271a02dfd7b982e953
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500241.gamma.1538698.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2aafd37b80ddb9ef012de0b5314324966c2aa7c1e2bb78e7395c5ef136b3fb15
|
| 3 |
+
size 231450
|
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a5171cc25225a88fc7ed546bcbbc39ff906b90bddf4b9baed5bb78b0b2d8dd19
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500247.gamma.1538878.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d30195178aa65fbf58bcace9ef55342a16110e736d81ccdc28aadb7d5b45a11c
|
| 3 |
+
size 117782
|
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=3/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500725.gamma.1543513.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dbcf5bf56f0b9bdf5b92323c5d1fae14daf64d3b2d3d9c531ef36f74e14e192b
|
| 3 |
+
size 94190
|
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=3/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2a4b2875aa477a90738956360dae1de5c6e9aae31ed40dc85fd5613d69de9b91
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/bias_shift/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737549564.gamma.1638424.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e0de210a9ec493f778618f7d39e01d338b12e30a46779de7e8b2659c7fbe6f50
|
| 3 |
+
size 308518
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/bias_shift/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe816942c45370cf7ad87d7eb97fa72f387db03d96a22febdf578c7b0c99ca11
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737549528.gamma.1638002.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6bd065e3c12aec66920abe51b39801768916f4f3d9685c6073f019c7d6188168
|
| 3 |
+
size 382598
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fa1a3db865f4fbec33a6f204bae46e262d49bd11a08df52df312f32d4d1ccaf7
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737549538.gamma.1638140.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ef88797aad3e462c0e08ccf73070fd4099f5bb37e358d2667e0569c447c1896
|
| 3 |
+
size 219270
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c73d991e61c00be28105b0dd5de7c9a8b7b25d56c6edb7929921bb8019088d97
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737549544.gamma.1638289.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d14b0afcb18ce1f813b092943f62f89cb575701711fb3235ed8c59bd9e3bdea4
|
| 3 |
+
size 887066
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7ccdfc4c23c6be9819c20669ab469c6f707e5fe0857a88e324225b50b4c712b0
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=1/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:28948420a62e5ae849ec22800183de278e0fb20c9a59ba1769d71c120f2b86ce
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=1/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9cfa347080c4f9eb32669cd38b696712e3d4129de05060daf167e8b530d8a39f
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/bias_shift/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550451.gamma.1644992.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e97f6d2dcb0bd1c46ac651eaacba046583e5463fd6b992e85518efb1fa9290a7
|
| 3 |
+
size 325754
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/bias_shift/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5b7bdf554533d6997c58330838e275e675e0550061ee77579a56a47d5b585ea9
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550413.gamma.1644570.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e72497aeb76e24e578cf74136a5ab3b28986f4d1c3a92e727f42d1585ea804f2
|
| 3 |
+
size 360914
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0e43c34a71f8ff353250a798a8bd47f870edd546f20c5cc0d8a7919290cd63f9
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550422.gamma.1644707.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:99b4f9b8f38f1ceabb94669ac354bf95b508e0e47b5573c2bb9cf58a92d4c6c9
|
| 3 |
+
size 212558
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:749687e06f2e13d4c9fd0a0d624a9f897ca983120c4d174ec9f762207e121abb
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550428.gamma.1644828.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cafbde1efd2dc632a264a9dab0cd022d170a36d0891e8b5ba749dd30d7bd2232
|
| 3 |
+
size 934130
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6b0054108ca1f224fc7ca16d148bc0040c5f2323714ebc11936cf8b93b417098
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/bias_shift/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550884.gamma.1647198.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7069f55f0e6bb45523be4be9f8b878ce3c8ee6becfb7756e25a7acb67d90b9a2
|
| 3 |
+
size 325582
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/bias_shift/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:75aa4ea3f36e4eae0e187ef030143e7d165a4c88d596022bd71441eb728da4cf
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550865.gamma.1646832.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fbc506b10f44b9bf9458cfe1c7f47497a3d6a2d9bfed561f8d5df5c688445056
|
| 3 |
+
size 378458
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0aec0b0d3e6a0b44372f370b807bcb5d2de71605643dbf5039e31395ce4981af
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550874.gamma.1646964.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:17c499d9b93142b7f0c4a64265a13425316858cf1f9c5189b38565ec8fd2cd57
|
| 3 |
+
size 231742
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:93ee258f9cb0e49eb9d95f558a9c36b35da0c849857057ba9aa4a9fbb13e88f1
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550881.gamma.1647081.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fb7099e5aca8b04a326c00b3f922266ebe85cd8b2d2334f83a49b4bc1f337a3f
|
| 3 |
+
size 105986
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f6b5eda58c05e26cd29db75422b5e979942b8b30a2c67bb2af6a1d07715ddf50
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/bias_shift/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737551331.gamma.1648831.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4c4667a002ab5a5771e89f3e43790037ba17c2415c4baf53d25da5638d5e1dcc
|
| 3 |
+
size 326622
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/bias_shift/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d7488e8ac755c0561f4dfed03af819367c2201dac0c10240d4cb91a695d569d5
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737551298.gamma.1648450.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:95727ff61462cece451bbd3e92fac6cf0456e5e6786846c1d6c7d4928371d14f
|
| 3 |
+
size 384122
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4c72b027226a7eb4c3a01596d712dbfbf245de13be8ee6995894a4bf56ef104e
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737551307.gamma.1648582.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:49ef0bc98192f3ca06f880c48ff6d71e00e5ca25325bec3ff8c51a295a0c2ea2
|
| 3 |
+
size 221578
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:da016dd516c613f6327b956ea152d07176b55fc398b4123d825467e2bf5f88f6
|
| 3 |
+
size 1740
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737551313.gamma.1648699.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8754fbd37ded81e8124ca66f3e41f58698e4e2ea8f9f8594d061c1b9741f26bd
|
| 3 |
+
size 799678
|
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6eca72dad6edf966aee3eaaa08b73f7d761f7283ac5fdccb1ceff1ee494f0209
|
| 3 |
+
size 1740
|
finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/config.json
ADDED
|
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"LlamaForCausalLM"
|
| 4 |
+
],
|
| 5 |
+
"attention_bias": false,
|
| 6 |
+
"attention_dropout": 0.0,
|
| 7 |
+
"bos_token_id": 128000,
|
| 8 |
+
"eos_token_id": [
|
| 9 |
+
128001,
|
| 10 |
+
128008,
|
| 11 |
+
128009
|
| 12 |
+
],
|
| 13 |
+
"head_dim": 64,
|
| 14 |
+
"hidden_act": "silu",
|
| 15 |
+
"hidden_size": 2048,
|
| 16 |
+
"initializer_range": 0.02,
|
| 17 |
+
"intermediate_size": 8192,
|
| 18 |
+
"max_position_embeddings": 131072,
|
| 19 |
+
"mlp_bias": false,
|
| 20 |
+
"model_type": "llama",
|
| 21 |
+
"num_attention_heads": 32,
|
| 22 |
+
"num_hidden_layers": 16,
|
| 23 |
+
"num_key_value_heads": 8,
|
| 24 |
+
"pretraining_tp": 1,
|
| 25 |
+
"rms_norm_eps": 1e-05,
|
| 26 |
+
"rope_scaling": {
|
| 27 |
+
"factor": 32.0,
|
| 28 |
+
"high_freq_factor": 4.0,
|
| 29 |
+
"low_freq_factor": 1.0,
|
| 30 |
+
"original_max_position_embeddings": 8192,
|
| 31 |
+
"rope_type": "llama3"
|
| 32 |
+
},
|
| 33 |
+
"rope_theta": 500000.0,
|
| 34 |
+
"tie_word_embeddings": true,
|
| 35 |
+
"torch_dtype": "bfloat16",
|
| 36 |
+
"transformers_version": "4.45.0.dev0",
|
| 37 |
+
"use_cache": true,
|
| 38 |
+
"vocab_size": 128256
|
| 39 |
+
}
|