lestienne committed on
Commit
f9856f3
·
verified ·
1 Parent(s): 01b6325

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/bias_shift/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500015.gamma.1536692.0 +3 -0
  2. calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/bias_shift/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  3. calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737499999.gamma.1536345.0 +3 -0
  4. calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  5. calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500006.gamma.1536464.0 +3 -0
  6. calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  7. calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500012.gamma.1536578.0 +3 -0
  8. calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  9. calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500233.gamma.1538502.0 +3 -0
  10. calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  11. calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500241.gamma.1538698.0 +3 -0
  12. calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  13. calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500247.gamma.1538878.0 +3 -0
  14. calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=3/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500725.gamma.1543513.0 +3 -0
  15. calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=3/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  16. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/bias_shift/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737549564.gamma.1638424.0 +3 -0
  17. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/bias_shift/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  18. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737549528.gamma.1638002.0 +3 -0
  19. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  20. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737549538.gamma.1638140.0 +3 -0
  21. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  22. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737549544.gamma.1638289.0 +3 -0
  23. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  24. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=1/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  25. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=1/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  26. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/bias_shift/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550451.gamma.1644992.0 +3 -0
  27. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/bias_shift/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  28. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550413.gamma.1644570.0 +3 -0
  29. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  30. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550422.gamma.1644707.0 +3 -0
  31. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  32. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550428.gamma.1644828.0 +3 -0
  33. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  34. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/bias_shift/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550884.gamma.1647198.0 +3 -0
  35. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/bias_shift/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  36. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550865.gamma.1646832.0 +3 -0
  37. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  38. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550874.gamma.1646964.0 +3 -0
  39. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  40. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550881.gamma.1647081.0 +3 -0
  41. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  42. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/bias_shift/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737551331.gamma.1648831.0 +3 -0
  43. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/bias_shift/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  44. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737551298.gamma.1648450.0 +3 -0
  45. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  46. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737551307.gamma.1648582.0 +3 -0
  47. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  48. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737551313.gamma.1648699.0 +3 -0
  49. calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt +3 -0
  50. finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/config.json +39 -0
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/bias_shift/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500015.gamma.1536692.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:659a539e737edaa2aeafe8b62470c1c9bcd9e0e78042af4073f7f615fc5b96eb
3
+ size 309890
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/bias_shift/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c6d642ac60ca833f3726db86f282ffa67f68b2d02d5bf7b2f770048968e2080
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737499999.gamma.1536345.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af6b00d4c96c18d5da99f19b94a9954ddfee8d5631428ae19941e7ebd3c6e042
3
+ size 350866
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81f2f35c4d2ec89c4e4e78c4eff3d39ba3c6072daf800760c5beb6cb82705314
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500006.gamma.1536464.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c13b8870204a67e5697d98d77b54088196a0718905ff8427189e886024dd4da5
3
+ size 209386
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa527e8c8110319ff9b435664983945d6744e97e178df0c26a1955f40269a75a
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500012.gamma.1536578.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bcdeb98534784d8cdf7528d3be1f8d3d82d1a2451ec378b23b63a33343ce54f
3
+ size 58802
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32dc8f282ed7accd041e25c0583ac3b7838df0c94b3e9259ef6a33c756e5d3b9
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500233.gamma.1538502.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0e7cd3e4f8b25d82fc3b1a68d21020840fa34b0eac1f032c7b9827dd2015189
3
+ size 371082
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db27831e7a9a4f9f69db5597d197402f3b43169c2e994c271a02dfd7b982e953
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500241.gamma.1538698.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2aafd37b80ddb9ef012de0b5314324966c2aa7c1e2bb78e7395c5ef136b3fb15
3
+ size 231450
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5171cc25225a88fc7ed546bcbbc39ff906b90bddf4b9baed5bb78b0b2d8dd19
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500247.gamma.1538878.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d30195178aa65fbf58bcace9ef55342a16110e736d81ccdc28aadb7d5b45a11c
3
+ size 117782
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=3/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737500725.gamma.1543513.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbcf5bf56f0b9bdf5b92323c5d1fae14daf64d3b2d3d9c531ef36f74e14e192b
3
+ size 94190
calibration/qwen2.5-7b-instruct/dbpedia/size=128/seed=3/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a4b2875aa477a90738956360dae1de5c6e9aae31ed40dc85fd5613d69de9b91
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/bias_shift/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737549564.gamma.1638424.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0de210a9ec493f778618f7d39e01d338b12e30a46779de7e8b2659c7fbe6f50
3
+ size 308518
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/bias_shift/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe816942c45370cf7ad87d7eb97fa72f387db03d96a22febdf578c7b0c99ca11
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737549528.gamma.1638002.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bd065e3c12aec66920abe51b39801768916f4f3d9685c6073f019c7d6188168
3
+ size 382598
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa1a3db865f4fbec33a6f204bae46e262d49bd11a08df52df312f32d4d1ccaf7
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737549538.gamma.1638140.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ef88797aad3e462c0e08ccf73070fd4099f5bb37e358d2667e0569c447c1896
3
+ size 219270
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c73d991e61c00be28105b0dd5de7c9a8b7b25d56c6edb7929921bb8019088d97
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737549544.gamma.1638289.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d14b0afcb18ce1f813b092943f62f89cb575701711fb3235ed8c59bd9e3bdea4
3
+ size 887066
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ccdfc4c23c6be9819c20669ab469c6f707e5fe0857a88e324225b50b4c712b0
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=1/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28948420a62e5ae849ec22800183de278e0fb20c9a59ba1769d71c120f2b86ce
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=1/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cfa347080c4f9eb32669cd38b696712e3d4129de05060daf167e8b530d8a39f
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/bias_shift/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550451.gamma.1644992.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e97f6d2dcb0bd1c46ac651eaacba046583e5463fd6b992e85518efb1fa9290a7
3
+ size 325754
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/bias_shift/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b7bdf554533d6997c58330838e275e675e0550061ee77579a56a47d5b585ea9
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550413.gamma.1644570.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e72497aeb76e24e578cf74136a5ab3b28986f4d1c3a92e727f42d1585ea804f2
3
+ size 360914
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e43c34a71f8ff353250a798a8bd47f870edd546f20c5cc0d8a7919290cd63f9
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550422.gamma.1644707.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99b4f9b8f38f1ceabb94669ac354bf95b508e0e47b5573c2bb9cf58a92d4c6c9
3
+ size 212558
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:749687e06f2e13d4c9fd0a0d624a9f897ca983120c4d174ec9f762207e121abb
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550428.gamma.1644828.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cafbde1efd2dc632a264a9dab0cd022d170a36d0891e8b5ba749dd30d7bd2232
3
+ size 934130
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b0054108ca1f224fc7ca16d148bc0040c5f2323714ebc11936cf8b93b417098
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/bias_shift/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550884.gamma.1647198.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7069f55f0e6bb45523be4be9f8b878ce3c8ee6becfb7756e25a7acb67d90b9a2
3
+ size 325582
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/bias_shift/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75aa4ea3f36e4eae0e187ef030143e7d165a4c88d596022bd71441eb728da4cf
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550865.gamma.1646832.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbc506b10f44b9bf9458cfe1c7f47497a3d6a2d9bfed561f8d5df5c688445056
3
+ size 378458
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0aec0b0d3e6a0b44372f370b807bcb5d2de71605643dbf5039e31395ce4981af
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550874.gamma.1646964.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17c499d9b93142b7f0c4a64265a13425316858cf1f9c5189b38565ec8fd2cd57
3
+ size 231742
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93ee258f9cb0e49eb9d95f558a9c36b35da0c849857057ba9aa4a9fbb13e88f1
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737550881.gamma.1647081.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb7099e5aca8b04a326c00b3f922266ebe85cd8b2d2334f83a49b4bc1f337a3f
3
+ size 105986
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6b5eda58c05e26cd29db75422b5e979942b8b30a2c67bb2af6a1d07715ddf50
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/bias_shift/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737551331.gamma.1648831.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c4667a002ab5a5771e89f3e43790037ba17c2415c4baf53d25da5638d5e1dcc
3
+ size 326622
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/bias_shift/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7488e8ac755c0561f4dfed03af819367c2201dac0c10240d4cb91a695d569d5
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/dp_calibration/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737551298.gamma.1648450.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95727ff61462cece451bbd3e92fac6cf0456e5e6786846c1d6c7d4928371d14f
3
+ size 384122
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/dp_calibration/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c72b027226a7eb4c3a01596d712dbfbf245de13be8ee6995894a4bf56ef104e
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/temp_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737551307.gamma.1648582.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49ef0bc98192f3ca06f880c48ff6d71e00e5ca25325bec3ff8c51a295a0c2ea2
3
+ size 221578
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/temp_scaling/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da016dd516c613f6327b956ea152d07176b55fc398b4123d825467e2bf5f88f6
3
+ size 1740
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/vector_scaling/0.0-1.0/0.0-1.0/logs/events.out.tfevents.1737551313.gamma.1648699.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8754fbd37ded81e8124ca66f3e41f58698e4e2ea8f9f8594d061c1b9741f26bd
3
+ size 799678
calibration/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/vector_scaling/0.0-1.0/0.0-1.0/state.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6eca72dad6edf966aee3eaaa08b73f7d761f7283ac5fdccb1ceff1ee494f0209
3
+ size 1740
finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "LlamaForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 128000,
8
+ "eos_token_id": [
9
+ 128001,
10
+ 128008,
11
+ 128009
12
+ ],
13
+ "head_dim": 64,
14
+ "hidden_act": "silu",
15
+ "hidden_size": 2048,
16
+ "initializer_range": 0.02,
17
+ "intermediate_size": 8192,
18
+ "max_position_embeddings": 131072,
19
+ "mlp_bias": false,
20
+ "model_type": "llama",
21
+ "num_attention_heads": 32,
22
+ "num_hidden_layers": 16,
23
+ "num_key_value_heads": 8,
24
+ "pretraining_tp": 1,
25
+ "rms_norm_eps": 1e-05,
26
+ "rope_scaling": {
27
+ "factor": 32.0,
28
+ "high_freq_factor": 4.0,
29
+ "low_freq_factor": 1.0,
30
+ "original_max_position_embeddings": 8192,
31
+ "rope_type": "llama3"
32
+ },
33
+ "rope_theta": 500000.0,
34
+ "tie_word_embeddings": true,
35
+ "torch_dtype": "bfloat16",
36
+ "transformers_version": "4.45.0.dev0",
37
+ "use_cache": true,
38
+ "vocab_size": 128256
39
+ }