diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349096.gamma.2163059.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349096.gamma.2163059.0 new file mode 100644 index 0000000000000000000000000000000000000000..98ccf5d5e6f902fcd26437332176acb3c4ae946c --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349096.gamma.2163059.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7f6c07ab5fe11259f584fd6b7276f45ca96968c06decb15e68f13cbc616d75a +size 247090 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..c6ac28a1ee4d4b8251f1296a9cbe29a2e4e779f8 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9d37af384b532d89b7bfe151604e72529467647cec1c1838efff06a56afad4f +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735348908.gamma.2161969.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735348908.gamma.2161969.0 new file mode 100644 index 0000000000000000000000000000000000000000..783e31669f1f74934f80509a89a1d87d95ea0f6b --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735348908.gamma.2161969.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feca193f7d9f9f8909528a73f613a8361e46d0738edd9a4fdda7abd2e14f787e +size 247962 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..2782aba4de05b1839e45688f19e21205dfb98b37 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:068aa4ab6ebe881534254715a7ac7018211f34ab5145147dda81b5927875f737 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349230.gamma.2165293.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349230.gamma.2165293.0 new file mode 100644 index 0000000000000000000000000000000000000000..626410d206e763b7188fc1548818331fea2d3b51 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349230.gamma.2165293.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0a0d55d3b2369224998805f3023ac1522d10cb74c3c68f344e7b86dd8282dd8 +size 206418 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..196a2ab6844e98d3a225bf7c7709d6914fee88f1 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc45e5b70785384b5fe1bb414ca6504213ac31ad34ccc9fd3384924ae21d7793 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349172.gamma.2164349.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349172.gamma.2164349.0 new file mode 100644 index 0000000000000000000000000000000000000000..f931a046d58831149247320ccbf346bac8d6aa68 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349172.gamma.2164349.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c242814d34ffd4ec9526129fd2c6d137f326fee42a61f60ea86bc35c26226823 +size 268766 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..ef286e815f172d9968692549f1915187ace7534b --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efb7694f179cd9b9187c6c0749b18e3018df2bba8909910ca170b03d4e660a65 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349357.gamma.2167437.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349357.gamma.2167437.0 new file mode 100644 index 0000000000000000000000000000000000000000..0c10962bde6fc56fca4ebe53e5ce5c7c6a965959 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349357.gamma.2167437.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73ded1c9b96aeb8f99a6bd62a14e4cd49339e8cc7483e73290f92644c8365eb6 +size 157772 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..95a053a65c5569f31ed3b3cb3f47f492ba8fd120 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:799ed0450aa054f49da0194b851b14108313d25aba689554386ccd66f0d76a5d +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349304.gamma.2166507.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349304.gamma.2166507.0 new file mode 100644 index 0000000000000000000000000000000000000000..32b0d8ef0729a62cf7186b8908d70b2126c60139 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349304.gamma.2166507.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50ee42e2b828b68a8efbbbaa28a5a47a42629b0dd61521c51ee15bc275852eb7 +size 255910 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..e253891211b78a058bb2bf658f926b1b9c30e8db --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c0c50ddf114f0c81e84ad76ca8d13fd02097daf56dfb013a1f3df3b3b3a8d8d +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349486.gamma.2169573.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349486.gamma.2169573.0 new file mode 100644 index 0000000000000000000000000000000000000000..c15b8d1d0e67dd661670b6df6d8990b8ecfe8a22 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349486.gamma.2169573.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05eaf7f7886d6e20c5e6782e172c83dc6c09ef683ef5455acbb8f11169001851 +size 189194 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..4f273dd8c10a91fe9d4eded26fad9687bd9f7469 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:413edbde9f438209b082f6aeab8c7232415948673880f8ac182624ed2d470c48 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349430.gamma.2168638.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349430.gamma.2168638.0 new file mode 100644 index 0000000000000000000000000000000000000000..7424f7c227b9304db582143ed65e896e57fbcef7 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349430.gamma.2168638.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c66e8d391f000590637a3713111cf10fb89cd33f414d715d79d2714d44c5b7e0 +size 257686 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..6d97ee38a2fe077676528d47b300fe700856a1fb --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7718a731e59d55dd3907eece58e0ff7f13c14a98013827f1cf6bd3cfa9b2ef1a +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349609.gamma.2171699.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349609.gamma.2171699.0 new file mode 100644 index 0000000000000000000000000000000000000000..80373f1611dc0bfdfac8f7959c3b4fae6ad26e1d --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349609.gamma.2171699.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f55c6cbbdbe4071253e02f2415b5ab687e8d6af9ea40944f9fecddc1e2ae3ab +size 240262 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349556.gamma.2170773.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349556.gamma.2170773.0 new file mode 100644 index 0000000000000000000000000000000000000000..a34d05e2c560fe20f7839b96e84c38dd4f90dabc --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735349556.gamma.2170773.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd9968b85d948dec8b96a524ba51cdf4ab9b9f4ba744bace4e87c4746701e94a +size 245690 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..0bf3f54ae44ff8dbb0f4970d28e084a94b0b9083 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ab8868f5d966cf8c3b0bdfa4afc47e4a098c92a7276a6f48ca99b5011ea13b8 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983302.gamma.3374690.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983302.gamma.3374690.0 new file mode 100644 index 0000000000000000000000000000000000000000..b1df650e6038bf41841d0fde79cae19d1889ec93 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983302.gamma.3374690.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac1d5cfd1692d8e1d8ccea5e3d3dac0ab9497e648f0aea0698d87c6d114dad53 +size 155772 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..5f5e12b5fb69ae21c86d86f0a369ca313a1e8d3d --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90d13e577b150822f6d388b545c947384238a94d728f0f678b633fea111500ea +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983243.gamma.3373748.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983243.gamma.3373748.0 new file mode 100644 index 0000000000000000000000000000000000000000..896b038211538f1509147f688382e29c8b10b2ba --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983243.gamma.3373748.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a5dfc36feed1f107ac6c44f85a2dcbb18e6b3f3d13ae61b7c33a3c6f8fb9904 +size 246370 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..e125fa548c1c4fac71842eff0e9f52c998800b5d --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34b89ae006c3fbbe8ea34cfb16bc8141bc61b605a65929d3c21e5c9129bdf127 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983462.gamma.3376885.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983462.gamma.3376885.0 new file mode 100644 index 0000000000000000000000000000000000000000..94fa4d76bdbb8ab559e533d9e37bee4ba429cc55 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983462.gamma.3376885.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b461e9df4de8d14ac64e4419a3e6fca3a02f17961ac662e270a4a30b0bfc2d01 +size 251794 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..b2590a6b65547978da776f6be6538ff175f2da8c --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd3fc1eb1d821bbd1369388c3c30bc5831a8b5dbaa594321640d278cc34650be +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983391.gamma.3375928.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983391.gamma.3375928.0 new file mode 100644 index 0000000000000000000000000000000000000000..bc362f537557222a0eb91ca7d41f01114f1734f0 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983391.gamma.3375928.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85c6a80651a592b4206ed31131e798462b15d55a9e18741e25c8110242c2c507 +size 253414 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..a620599ac7d604125fcda3358fbae637513e3611 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8276c40d502cab5fa0d7502b094126465ae4866f374c4bccacd6e9891428c24 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983570.gamma.3379052.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983570.gamma.3379052.0 new file mode 100644 index 0000000000000000000000000000000000000000..50db33e2b2fe8f04ba1692ce90c33afc19092c10 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983570.gamma.3379052.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:518c424dc1076387ea7a604d115a1a72d5bbe72e739658a8726b7332809bd350 +size 167390 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..1abcd5a945531d813fe885c316ba8f42664c7642 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c015a3af77cdf325e53ec78ef01ae5197f64f5ade2844db1cb8bc449f4aa1d66 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983526.gamma.3378141.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983526.gamma.3378141.0 new file mode 100644 index 0000000000000000000000000000000000000000..e816255b6fed5ae35f50138602fd48cb197001de --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983526.gamma.3378141.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1b1f33a26bd3f33262361a6388395a6cde67b4e76ac83db4e3239c11c96c3d8 +size 234786 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..a78f82fd585a202bddb2ff955f9e0411c94a4afe --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cf97d23e3ee9a0bd1b82d5d6ce5053eb28bfc18e365a4425f6d96b941a7fe84 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983686.gamma.3381288.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983686.gamma.3381288.0 new file mode 100644 index 0000000000000000000000000000000000000000..697496db1dcc632e3dc5699907bda78b39539854 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983686.gamma.3381288.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ab48a2b1a4ef93832337fe368ebffd800201e4f8460df499a07106ae73346ae +size 200178 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..27a26cca653895a173f8426f4556bee52f49097c --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2e7ba4e4ce38888bd9e2716a93f62e3d7c4d12fee91e8a6150c3b6fd76bf32f +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983636.gamma.3380261.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983636.gamma.3380261.0 new file mode 100644 index 0000000000000000000000000000000000000000..d20f11f532913011c600492643580e8647fb4da3 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737983636.gamma.3380261.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2133c3260d616b5b87776b38a52bd90a91ae67f65860da236f8adf8b2884c484 +size 258854 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..83c15f917d377b444b4a2bd412ec0f330895c4f6 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=16/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3a8813c5cb4bb0107d6ea688944cb0dd2790bcca6675d6452cf21b7e96287cb +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356290.gamma.2231395.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356290.gamma.2231395.0 new file mode 100644 index 0000000000000000000000000000000000000000..46eed9d6f5a9702723b8690f1057b40eb8d7cf68 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356290.gamma.2231395.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d6900bba0b544748f575c6d80e5cc0ef18eadd4c2fe5f32f273b904cf1237b1 +size 248274 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..9285e7e45fb1e377b31e8fbb73b8a9f734cd2e54 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c938c35fcdb1efad872e53302d38b7a1182c260f3766e74f2326f5092a3b2432 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356246.gamma.2230505.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356246.gamma.2230505.0 new file mode 100644 index 0000000000000000000000000000000000000000..5cd935e360d798f2a5f15b4fb85163673f1e52eb --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356246.gamma.2230505.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98f6d467adec6db898432eb1c61fcd53234efa20b199603e55874f7dbd4de278 +size 260010 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..36fc5a8ca7e2a8bd105ac846ebb2b2a0a29a6e18 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fae4d859d9adc2656cbd7a43f7d710ad2c505a55fb7b73f46395ed57dc84b3eb +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356403.gamma.2233536.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356403.gamma.2233536.0 new file mode 100644 index 0000000000000000000000000000000000000000..078faa4856a2032f8e4497cda5f20ce7a34a36f0 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356403.gamma.2233536.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f1a3b5a5fb2c134fd638d2ee7ebbb0aa705e75139297f6e0a040279e640b6ab +size 267510 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..a1de80a7d74f8bb9196413761073eb24074b8dfb --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f6c054ef2483b4453a30837cbe6bbdf7d8200493c85906e9e2c68da65ba1b03 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356358.gamma.2232605.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356358.gamma.2232605.0 new file mode 100644 index 0000000000000000000000000000000000000000..d2447a22698898ab9293054596ee66363795fcbe --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356358.gamma.2232605.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3ea8007acf02eb211048f45be2d781e4222747faf4cb2a96717638271500f27 +size 269994 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..53b175e72e4528b78741ca1a5e79b9debda586d5 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90dd6b7285d637853ef9e0f19c1e665b86bb1902bbe97115ea29c10f7076a56b +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356572.gamma.2235767.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356572.gamma.2235767.0 new file mode 100644 index 0000000000000000000000000000000000000000..55701d9063f90e1bd456c9fab56ea0788ab790b0 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356572.gamma.2235767.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a0fd66b449f133c4a3dcd0a4ffb2fb83f796dbb0f614d7310a0d7b84dc51c19 +size 262294 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..462c5758c7f50b656ad82033f3bd9233f252f1d1 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1719717b0bb7ed0bd63b87ca078ae099d9673cff56eae246f5f6ee4363a98963 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356499.gamma.2234813.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356499.gamma.2234813.0 new file mode 100644 index 0000000000000000000000000000000000000000..711dfe94d007d1f39528898be9a9a1a9dfadf6a1 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356499.gamma.2234813.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60bc72c9d25836e4b99d05c6f33bc4fe8a61fb73c29f0ee398a5559fcbc8c485 +size 264590 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..149a68cc85a7ebe01b063ab101c80360f724a5d2 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e4f661f1ce59c696637f00d6ddad9416c6d52ed60896148bafee762e5f6c070 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356682.gamma.2237898.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356682.gamma.2237898.0 new file mode 100644 index 0000000000000000000000000000000000000000..81bc86b680b4553175961498ea497c057ef1bc6b --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356682.gamma.2237898.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4c3130ac3da80e30b420b1798c159b0fe9bb17c75aead35873202e4b63770a2 +size 260434 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..9e1da3e48128f7a24700f4176b042af7c2dcbff0 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e2f62d036b6fa5c4635e4f7a39b2b755f632e6b3cbfb214448668db96a0b8bb +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356638.gamma.2236984.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356638.gamma.2236984.0 new file mode 100644 index 0000000000000000000000000000000000000000..176a3522fe2e9d802d5c3e47340e1b56ff033492 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356638.gamma.2236984.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b14b102ff3da211867a81ea17fc420fcdc54ac4a472984d5a87e5b4231fbe258 +size 262926 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..ec9b8d46066c1751b803dada7d37b1d843d1d72c --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d2a85a1c79de7c40ddb987c9059d55a57c2fbd083bb13e6808700fc5e583169 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356791.gamma.2240064.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356791.gamma.2240064.0 new file mode 100644 index 0000000000000000000000000000000000000000..fd73ca4186fbb8bcb2ec082fd6778937906ad284 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356791.gamma.2240064.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b56d812f3793e7359f1011c1ead01af92212b47a2dec433c11a4b1d791b8d9b1 +size 210790 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..6b1c4bee73a272604a8674cfeabf74e85bb82cff --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed45a947e73520bf503dbcd4fcbeabf13bd459fad387990ce3a534bd5f42f2f0 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356747.gamma.2239142.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356747.gamma.2239142.0 new file mode 100644 index 0000000000000000000000000000000000000000..f83c0723538d545f9946661ceddb46f9dbe3fac6 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735356747.gamma.2239142.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9a0a48dd7e23d8a51fd27a788ff68ce80b5094eeaccb1d4af63202520052758 +size 250034 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..26109654465d6e5469fa2946b188fd61c20aa432 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af48b360ed9a1d992583797517f3f10332726d8f28c9d9b46d1ac4111116ed5c +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984275.gamma.3393678.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984275.gamma.3393678.0 new file mode 100644 index 0000000000000000000000000000000000000000..ae4f6783a35751f88a509eda321ddf91d52ed845 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984275.gamma.3393678.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94b9edb935233b72b99f9bdf034caa5af94015b8bdf974aa8b4e862be24ed94d +size 259342 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..928a5f48901c69d20852ad415a693d38f3fb1c79 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abc7c0409eb1f7d4c7165312d8dc1f1557e16fecca7958555df4b433f4697184 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984228.gamma.3392761.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984228.gamma.3392761.0 new file mode 100644 index 0000000000000000000000000000000000000000..2a6e1ca2de0e48e1ebfd48b8e7b64a6855e24b79 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984228.gamma.3392761.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c7a0b86dde0c60cdb36c9b0703688286cd0ca912b0f8de553b305cb47b6befe +size 260198 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..962b0a790837176efc57d45eb61ced1c824eaba7 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bfe434a9ed8525c032236a43bb0feafbe16b144a1341918328838d2748274b5 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984423.gamma.3395871.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984423.gamma.3395871.0 new file mode 100644 index 0000000000000000000000000000000000000000..7fc315f2b4d161eab56364fb9db7db28e40250b3 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984423.gamma.3395871.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9263f5d74aed3cbaff28bf377c30d29ccb3b0f7c1b0cbb27e7b6adea367b0e1 +size 249318 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..e8ac8c7b1f4312c56cab664efac60f56d7c877ee --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c308a63dd3080118758f211cf8ac1d437c1ba763cc0500bb9e38d6f46a5c3cd +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984361.gamma.3394931.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984361.gamma.3394931.0 new file mode 100644 index 0000000000000000000000000000000000000000..24edf21203cfc06d946304933b4726e07c7165e9 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984361.gamma.3394931.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0cef5da0f866ae1a160e7ee00fa1402e30c08dd19a1796b0aae4aaee7cb52cd +size 264970 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..30c20a0331f7fad9cd25f8a99b53f177859ad0f5 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d636209966116cf265ab60160a1da49d854f2a1d2834224b176f48baa0d1293 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984568.gamma.3398058.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984568.gamma.3398058.0 new file mode 100644 index 0000000000000000000000000000000000000000..92d5e11f7a50e1c29cbc325a9d49715d7e30b84d --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984568.gamma.3398058.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97cc8cd6205fbd29568531a0723af786a80f75840149dd1432af0b7e99add37e +size 247934 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..d2806f5273e709a9d9a130f748ff92ca41bb3896 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48c4d15466f2583afcb89b42b840e022267793d6375d53564ab1149f54d3aeab +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984507.gamma.3397121.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984507.gamma.3397121.0 new file mode 100644 index 0000000000000000000000000000000000000000..550e53c9c2b373ce08f54d76381d06af2752fda8 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984507.gamma.3397121.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a94288f8ff7f4df4b6c567f6dcb1cc697c273479f9e0639c7db170a2c4dc3b6 +size 249654 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..60c1c866f786c13673929ac48129a1c13e72cbe8 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cee5a0293cf2af15233d9ce713832111ac94641d9d04c5d6a7e025ff0e2fbb4 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984686.gamma.3400233.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984686.gamma.3400233.0 new file mode 100644 index 0000000000000000000000000000000000000000..f842dc77e6066c6fb4e4fd4ba27877d5e41698dc --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984686.gamma.3400233.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c005d688aa7dace71299df075476fbc139ba472a4fff4e9f6989352db7ed3ac1 +size 243938 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..942afc8ce0f6cf5eb54f3081f8ebb758e47765bc --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98c797a50124eca7668ef22c43eace25f3a9a28096a2d24b2e7e4e6872636b72 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984638.gamma.3399298.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984638.gamma.3399298.0 new file mode 100644 index 0000000000000000000000000000000000000000..b9f6b435dd469862ec922f21f7e9ced9ea61975d --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737984638.gamma.3399298.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66f83b81febc5931ea4b256b56f1b6a6702d9862bf3eb42de26e1ed9c3763f73 +size 269518 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..45487af9dc0f4a5a57c7cc0f7ef8cd1b8bc6a777 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=32/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:523dd67ce2d788c12faae1efc7a225ac06b22b730fc5db3eee97b3239071462c +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=64/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736166303.gamma.239655.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=64/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736166303.gamma.239655.0 new file mode 100644 index 0000000000000000000000000000000000000000..c184ecfa1fec5d1e8ecae36add4c04730a892d2f --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=64/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736166303.gamma.239655.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd300794f54d395cd808df0c5fe9adc02d70e0306ab81e01500a77442883f84a +size 265922 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=64/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737985290.gamma.3411207.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=64/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737985290.gamma.3411207.0 new file mode 100644 index 0000000000000000000000000000000000000000..ac1ff4c1b2e4eb50c668a2ab0349a8882ddfbe30 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/agnews/size=64/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737985290.gamma.3411207.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeabae592a8b4818c4459fe360de15497628347c08d5f2f069c58bdd2bc8a646 +size 267382 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185093.gamma.309438.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185093.gamma.309438.0 new file mode 100644 index 0000000000000000000000000000000000000000..743028f456747418be8f74b8bba44db7ab5cf25b --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185093.gamma.309438.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfa32b25385870dced88ffa24d4ec87b13357bb414b7ca3eab0432d04a9b2e5b +size 3420 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..e82d99092278d77f9d408f131d75dc98ebb41d9b --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f30f0a0f2f180be5755c32e696b5d38af624bed2de913ad3371f18354e046d6c +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185049.gamma.308557.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185049.gamma.308557.0 new file mode 100644 index 0000000000000000000000000000000000000000..94464e6f6ba8848abdda40f4998e45a0ec8163be --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185049.gamma.308557.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1ef9cd8f0e4342100666fac5271c2be1daf6296fd91036bc98dcae216604111 +size 308690 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..a203ef50d0c750f66c22b823260078e924d6e03f --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7397c782f998b9311c17a6593f319c8398a8f488298074efa6c1cdd4e01a1eb +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185223.gamma.311510.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185223.gamma.311510.0 new file mode 100644 index 0000000000000000000000000000000000000000..5c63f703eb1292c78fa194fa7a7b54d820257616 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185223.gamma.311510.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70b6230fe277b7b8f215350cc094b8bece65f627a1fd45f551ffa5fac78f0914 +size 3698 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..8ed47bb617d94c2c10d1ec4b29d12733ada0e761 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:605b1a339f5644f746474ff5f8bcce59cc521a4402ab470f50fffbe2e4f9f671 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185173.gamma.310604.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185173.gamma.310604.0 new file mode 100644 index 0000000000000000000000000000000000000000..30dce72134dd6eab0f153a93b9e4a9438eaffedc --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185173.gamma.310604.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa641868467e55a1e5ac96d4ece4b670de14e40b9e6ab906e2d0fb5a62bbc085 +size 309986 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..9fece3eef890c8b5baa3031504ba08bdba364b44 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee3d4bb7a8b3976d2826245cf96804a231bbbaa7b378c5233d7e1c3b6d27b371 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185353.gamma.313586.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185353.gamma.313586.0 new file mode 100644 index 0000000000000000000000000000000000000000..00a8e09e1322d07cdd7eff41e0d9f6e03d123b1e --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185353.gamma.313586.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4db254ab4ccda73442f1d042c10885cbdb5670bb48b291b97d2f4b70879a5772 +size 3698 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..789159e22fcf4fb23cd95d805201131605fca7a8 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8f1d3460f5fc8aa701d9fef6fbeaa0452cb9da65c360f09a1c6b03d7805cab8 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185303.gamma.312701.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185303.gamma.312701.0 new file mode 100644 index 0000000000000000000000000000000000000000..b58b913d438884e7a0a74694ec3b05e85fba292c --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185303.gamma.312701.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8d7f1a91c320addd78fe420fcb71f1ea8491e05c6d68258457eb3144f41c9ce +size 312150 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..511449404c37ba0b082a5f1e0e6eb9d990b56d02 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9928d27b7c4285c0ad54d8245683df13d2f80418113141a845ef752ce590adcb +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185478.gamma.315649.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185478.gamma.315649.0 new file mode 100644 index 0000000000000000000000000000000000000000..62748131b1b31e826b78a8a544141a9a1ede8dd7 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185478.gamma.315649.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76ba33ea58cc131f2b3ff7f15a28fd6a9610d721f14beed44160d38efed7a8b0 +size 3420 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..63a64834c5363e874cf045b1efba7d6200989a51 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:104134c73c349db4566851282fc45484a034acd040a28ae8955cd1b40f39ef01 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185433.gamma.314765.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185433.gamma.314765.0 new file mode 100644 index 0000000000000000000000000000000000000000..a38e6558afedf2f664f3d45b9bef65f58417cc98 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185433.gamma.314765.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8dcc9ca504cdaad36e2bbb5eeeb729119af56df3233d58304535b69d5f29de8 +size 309526 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..70c4b2cd08bdd23a804db6ab9785f0bb7993f744 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff99054c99070b73ae7ae44e322dcd71b07256a0488edabfa3c6d3f855d6876f +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185608.gamma.317709.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185608.gamma.317709.0 new file mode 100644 index 0000000000000000000000000000000000000000..42ef31b884799bc4936f14f9b7e5917ebf2c81a2 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185608.gamma.317709.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1040b9f587f33ec1b74ef81cc9eb745c04282bd0b9f06686fed1216bb0f62d79 +size 266164 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..69b97354563a9537c5a2e37e797bcc52c20cd37d --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9ff0c72113a2579079392adb4ce4325682c89b96f89eb6258149019caa5e8c9 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185558.gamma.316815.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185558.gamma.316815.0 new file mode 100644 index 0000000000000000000000000000000000000000..1d147b6af7fd8d8b63dcfdff0bf6c54b1fc00c42 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736185558.gamma.316815.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d262af2a38a49d7e68280b2d11b6998ffeca6cc6bb173caca3cb8160fb4b84d +size 311238 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..fc7e14c2f0eff211c5c44e1046e17fae6efe50f8 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c6078909edfb7334960e27477bf6c7a59023d4b229373f532d5cc5564b787b7 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986182.gamma.3421734.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986182.gamma.3421734.0 new file mode 100644 index 0000000000000000000000000000000000000000..59bcdca468df1cc390c5528ac6225805b79a53a8 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986182.gamma.3421734.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:313c79177bab3ec016eb3ab63c5f533176ce98fbde2936dd414a9941926b1316 +size 3976 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..a97955efcb84b80372486f0fb8c55d40a9b96d50 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a31e2721c294ce7f95b6bc955ef2c8b4e8bca5a71afd260f985bc79cb0168269 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986137.gamma.3420798.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986137.gamma.3420798.0 new file mode 100644 index 0000000000000000000000000000000000000000..6efc7daf528549fc3ae4eeb23d7f41746afc3534 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986137.gamma.3420798.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f67e91d5e95d578ced11c1500e37aa87cb34c1c82f440259fc4c7a77bb9e8917 +size 313258 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..6730871dd924d8a9aaa1debdf438503042e18d5c --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaf77bda77e04e4f1ee0e86f8020902c816b638f047054b1f1b9643e5b2c0355 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986314.gamma.3423960.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986314.gamma.3423960.0 new file mode 100644 index 0000000000000000000000000000000000000000..645b1b593397b2256d66327cad78753e2cabc509 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986314.gamma.3423960.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe15fa545dd328c2a39d324e96aef613f578a98a311ebce5c30c4bb9a1ef3f87 +size 270624 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..38cb32f2848cceefe12aff4b172a39a25afa3dfe --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:605e575ca209b0bb3884fed3b57989d2fe9692601583872f37647a6921f85d51 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986264.gamma.3423007.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986264.gamma.3423007.0 new file mode 100644 index 0000000000000000000000000000000000000000..c96b7c247d1d2baccd2327e558929053f5c25030 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986264.gamma.3423007.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4e88b52b449900a4effcfa2be8f6452e41a94c3f479516c6f7754d8455f5a43 +size 312478 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..241c13ec8db4c581af2f7f786f08d9d4e0067ad9 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a9b1354e991501e540ef0398ca8de7c523c7534fd2f238220f1b113f1c3e0c5 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986453.gamma.3426194.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986453.gamma.3426194.0 new file mode 100644 index 0000000000000000000000000000000000000000..c5de2d623bef045fb14c8e657bbbeefe289e9dc1 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986453.gamma.3426194.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:564dae839f826a2de016fba53f33b32643fbf8aa144926cda2581f95c6b97200 +size 239608 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..e69d7c83dea5ddc0a184bdccb76cbee15952aea1 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:418d3454ee93e8c5814a4e2a827fdff84df9f79105feab2a3e5ae18599ac1ce2 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986400.gamma.3425234.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986400.gamma.3425234.0 new file mode 100644 index 0000000000000000000000000000000000000000..6fb676776c2857c90343823f53b6f91d7ba88da3 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986400.gamma.3425234.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e41ed436736937b338557d79448081c7210a1f8dbbe63856bfce0811ac11d230 +size 312430 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986591.gamma.3428562.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986591.gamma.3428562.0 new file mode 100644 index 0000000000000000000000000000000000000000..fbd2edb996b42bad23c3184a7af8dc8577331102 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986591.gamma.3428562.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8396b856aab33cb04f441b6b4eeb0fef91681c87e74da44bed93d2ec04538ebf +size 283822 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..173dd244ff6a4acbb86ac7587f802dce560d6fe2 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e7cf9bd63f3667afdf91bbaf84aaf1ca00394c84ce220dfe8165b8391a42084 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986539.gamma.3427518.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986539.gamma.3427518.0 new file mode 100644 index 0000000000000000000000000000000000000000..ba7977d1b3f04ab10a2fdde907d4a3d408b81429 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737986539.gamma.3427518.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63b2603874c4245ed3071a82e96c19790ade1fea26b434b771e219b9687ed681 +size 308490 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..6d59e9148d477c9ea2925f2785c4d3ff6d849397 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=128/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90c68f5d13902c10e062e0d0bd4da1111c2ee87bdfe20b67dd55df393749ffd1 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=256/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=256/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..d520729ea7947fc0478dd87907b7eaa1b4b7f307 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=256/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f5a1377f7d93528d2415746f75e22137c6d80ea7137750beebbd7ae58acc74e +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=256/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736221492.gamma.453338.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=256/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736221492.gamma.453338.0 new file mode 100644 index 0000000000000000000000000000000000000000..7baf4f8cc76aa48e5b237a6c1a04a9dcdb3cdfa3 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=256/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736221492.gamma.453338.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2427acb0e0c6a786686589ff5226faa04179de9cf04335392121adeb599bfffd +size 233372 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=256/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=256/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..5cf02f09f03fbfd05507762f8c885bfb735c597b --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=256/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86c6cf74e568ab714f814eb8fa6c71d9975ab0d5ea4b061e5a8eced72f508a3d +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=256/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736221434.gamma.452397.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=256/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736221434.gamma.452397.0 new file mode 100644 index 0000000000000000000000000000000000000000..e1e53d73bf93161432a13159b0ad29a88b9b2e45 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=256/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1736221434.gamma.452397.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:337e53e86d4236733cf8ac36e3fb8af61c22a1722d20d972d85bc38cb50ab6f6 +size 308318 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=256/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=256/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..83957d2702922f44f6fc1f9560ec582109d96d29 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=256/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:475a4415c5fd5a65b6bc2f2cce4325bee5a0edfc9b42247debeb661913c6b3aa +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=256/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=256/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..03524f9d03b5ad01d35f85be3fa78dc3fb412251 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=256/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:274a263752259addfcb43b5af067b8acd3566e5913b2d290899042d306b36a4c +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342474.gamma.2090684.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342474.gamma.2090684.0 new file mode 100644 index 0000000000000000000000000000000000000000..d2a9fe1f465b2c794b5c74588ee9512c35cff37d --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342474.gamma.2090684.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f08e4e20c223a2c2af4351d7db6e3a3e6cf9f230f4503a864988169a2c1fccd3 +size 304822 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..417160caa0ce1e729aa7c798cf79ac45ed48a63f --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=0/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aefe136bb53af3709f881795fa05c754a312f9bbfce0722d7af64cf1036fb8c9 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342437.gamma.2089774.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342437.gamma.2089774.0 new file mode 100644 index 0000000000000000000000000000000000000000..9d9ec255ea06465a26a453f7ed645198700d1f7d --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342437.gamma.2089774.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2901623159ea425e91380910dd7dad24a8283fc3749fbf8fef33dec79efe2d4 +size 303870 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..e5ff393967fd29219343a5d93e3d26e5b0546a0a --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d57b6841d250eddd8947a0185e70097639a1215caac549ce39783b0ae75d90b6 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342621.gamma.2092855.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342621.gamma.2092855.0 new file mode 100644 index 0000000000000000000000000000000000000000..fd484c063fd573a0bd4555ab3170b70d50becad6 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342621.gamma.2092855.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6d1a15e726afce1ac3d36cd713ab89577c841590d8374b08f2a4002f5be337c +size 312430 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..3d335fa28df903da9ad053fe5c55479ec95cc8ea --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=1/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56c18529c26b41861b9a562a036e714174960e511736f11e8509a1c97c2eecf +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342554.gamma.2091900.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342554.gamma.2091900.0 new file mode 100644 index 0000000000000000000000000000000000000000..ec940516a667b63447edd992bbabd1289d49ce09 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342554.gamma.2091900.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7050252726a22ed216c8a35e8cd68606c76eb9294080ff657e7e8facd643a57 +size 312906 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..464bdb4d0dd87a7dcaa41cb50c7cbab2eac8391e --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15f20af800f02f126053dff7b2f115f7c92de106a8bd49c1d8bffe40f3734f5b +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342710.gamma.2094927.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342710.gamma.2094927.0 new file mode 100644 index 0000000000000000000000000000000000000000..5595e4402c241880a95acd1751feddb4ef4e352b --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342710.gamma.2094927.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de3711b5735d3f69f6b09d89984eb389dd76e24c4ee33622835542485344ad2e +size 303958 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..de2848377e52af96d7ea8f6478806f2ff5983552 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=2/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06e98b44eedf86b74216cde431155155bf94f386e4f0bc45d5b2b2066606608b +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342673.gamma.2094024.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342673.gamma.2094024.0 new file mode 100644 index 0000000000000000000000000000000000000000..d50fed03aeef9e278c2b09f71b773812dfcd9388 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342673.gamma.2094024.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d35531be07e787407fd9e3c84455d5608775516617c342b89ad81af2c5bd4ad6 +size 302154 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..f788afaf41a560cf956b324b90ab5f6b5c13dd3a --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:391da1f930e7f696c77270be08eef10af4d54c1f7fee8aa452a3d3f5bbc3f51b +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342836.gamma.2097064.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342836.gamma.2097064.0 new file mode 100644 index 0000000000000000000000000000000000000000..afb0aeae4e9284dc69fb11140d9f3e82ae2e0db0 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342836.gamma.2097064.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f3224508aa6b562675791e7d87ca51416a9721ec7d2bfea5db01cef17e21b01 +size 310354 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..9b760f5f9e643df123546117da254028823cd233 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=3/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8a0c8f372243817824ab1532f5ba73e57cf8f7f7fa94cedb783cbd04b08fc65 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342781.gamma.2096128.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342781.gamma.2096128.0 new file mode 100644 index 0000000000000000000000000000000000000000..eaa0a1ad9144f38d5d9072e2bf5d4f8cf1af9447 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342781.gamma.2096128.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91dbab4264c3d3055a105244ecc8cca0af610db96792978a27ae0732db261d8f +size 310750 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..c0f384ddc8bfb136e9aa6773bf9f0365d7f40134 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:679645f397d4010336d61987cd45dd680ef72ba28582b2e0f2e938b9da284be2 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342925.gamma.2099131.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342925.gamma.2099131.0 new file mode 100644 index 0000000000000000000000000000000000000000..b526a3891a77678f7ace57b7cae6c27b04b23194 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342925.gamma.2099131.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:081a9e22f67d01f668d27ac58f98ead40d82a9fa9f2f002b28e1c0a379ef1583 +size 311414 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..e7e09aa8f3f8965626a6fbe4179cf896798570a9 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=4/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd18b1f8b45747f78497eae30bbe60c1889d6ff86463e8653f5b37d519302374 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342888.gamma.2098234.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342888.gamma.2098234.0 new file mode 100644 index 0000000000000000000000000000000000000000..36a3663ef022ead3aab79938386af6a6ca1ceb86 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1735342888.gamma.2098234.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9726994e5dbf01e76ee0d068a8b307237b294a08a4a12a95da60eaa0df6b147a +size 310094 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..6633245b05c33ed1ebdaf0b9e41cafcc537e6c3d --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c02c25dd20b0da371ade707c5c372f45651a219fa4213b82125c4a8a3538a22 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981555.gamma.3346585.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981555.gamma.3346585.0 new file mode 100644 index 0000000000000000000000000000000000000000..a52a25ea51b6271dd7084e6e6a97b8628f6dae89 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981555.gamma.3346585.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4abe4b85a1648bcfeda3f7f237d03d7739c52e77dd9689c12010cc8d31f54090 +size 300238 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..d1dcd9aaf32d321fc5b3de96112b687532882e82 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=5/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07f6385609925c0a42e654d68ea5a68058a431cec520c24cd4b74cc47cb97f5a +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981516.gamma.3345686.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981516.gamma.3345686.0 new file mode 100644 index 0000000000000000000000000000000000000000..d32baf26c3302b8870f00397988ea3e6e8f2a705 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981516.gamma.3345686.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73a04fa986d2c8cc305a1847926971cd4280dc098ce7aae1e4b31633d10ae603 +size 300806 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..7cda161c5afd8f4e7fabbd0313db11811384b189 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:963683fcbe00d9f8474bd240bdd2b375567c12b9819dff430c88105570be7ee8 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981697.gamma.3348785.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981697.gamma.3348785.0 new file mode 100644 index 0000000000000000000000000000000000000000..232239d87ac61f87f5289808cf345e10fff2e87a --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981697.gamma.3348785.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c4ad1af8a87231745281c48e187e28b8b637b9836600542a29bf1b52e98b01b +size 311338 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..e2fe7e36e950b2edab17e51a15fc3343287fd682 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=6/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39024cfe01526969420fddac9e3784e13a1a3c5e9ad4ceee70959a3e301c7cc5 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981634.gamma.3347819.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981634.gamma.3347819.0 new file mode 100644 index 0000000000000000000000000000000000000000..94317b183a0c23e0b69eddfc73bf9fb849c65e14 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981634.gamma.3347819.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b68f0f1717e5ae9ef2da21bb3c64092102f8917040e4dc43f6128ed3cdaec508 +size 312662 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..f223d4303027fa07e823b913c1e0a68c4f7752a6 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d180b2b4665c4f2e42e77099fa341a333b8a7752d7c3553440ec3d4a14f35d43 +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981829.gamma.3350956.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981829.gamma.3350956.0 new file mode 100644 index 0000000000000000000000000000000000000000..c33800e457e514e0be39154b62b8857fe1124cdb --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981829.gamma.3350956.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40c072e490dc573343106b9551eba993e4fe83bce3b16f086e27cec059b1ce4b +size 304922 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..44da3e33390044972a6a7c5a84f73de4cd87e91b --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=7/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eddd6d59afbc60c7c875e9318a17b78fdbbe29a005261dc6a3973c1f35d13cf +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981770.gamma.3350007.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981770.gamma.3350007.0 new file mode 100644 index 0000000000000000000000000000000000000000..29bbb159789478f8633e3028b4237e09fc6424e5 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981770.gamma.3350007.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0b84921b7e6f2e928e4fb8c9b5ce9fe173b6a9066389947e6234129be0f13a4 +size 305110 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..487dfdd76dd4af34dbf4639947be204bc4ae95bf --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83b07a96a7fe40a1f8a7bbff89c9c0ae4b9b264f204c7204daa44b26c3b9021d +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981922.gamma.3353035.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981922.gamma.3353035.0 new file mode 100644 index 0000000000000000000000000000000000000000..5cc0c54d81cf674cfcda20739e39d27250a6144e --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981922.gamma.3353035.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cabdb9899c20d55adf4dd0f8cdfc902e0fce97031936da46e947c0d37a11a0e +size 282502 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..1c890eda4342fafff589d591b2324b863b49d5b4 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=8/lora_ans/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5c5e9eae92838260276739b7c6c082bda13bc4a00255cba9c37bc6c61eff3ad +size 1740 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981883.gamma.3352130.0 b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981883.gamma.3352130.0 new file mode 100644 index 0000000000000000000000000000000000000000..a7f4ec078904583e313716c63fb223b0aa7e2e16 --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/logs/events.out.tfevents.1737981883.gamma.3352130.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d414ff0c4518a2a52a37b27333c8b884417d6dac04c8f2b3bf3def5dd818eb9 +size 282130 diff --git a/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt new file mode 100644 index 0000000000000000000000000000000000000000..8c5844da78d16695b97dc0cedf33cb3a4e8cc51a --- /dev/null +++ b/lora_plus_tempscaling_trainontest/qwen2.5-7b-instruct/sst2/size=8/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/test_400/state.ckpt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dada31965b1c5c209c52d0f3aed623037c6f0a9e461807fcda43ed9af968fb4 +size 1740