Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- .gitattributes +14 -0
- csqa__llama3_8b_instruct__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1251/rng_state_2.pth +3 -0
- csqa__llama3_8b_instruct__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1251/rng_state_3.pth +3 -0
- csqa__llama3_8b_instruct__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1251/training_args.bin +3 -0
- csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/checkpoint-1251/adapter_model.safetensors +3 -0
- csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/checkpoint-1251/optimizer.pt +3 -0
- csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/checkpoint-1251/rng_state_0.pth +3 -0
- csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/checkpoint-1251/rng_state_1.pth +3 -0
- csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/checkpoint-1251/rng_state_2.pth +3 -0
- csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/checkpoint-1251/rng_state_3.pth +3 -0
- csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/checkpoint-1251/scheduler.pt +3 -0
- csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/checkpoint-1251/tokenizer.json +3 -0
- csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/checkpoint-1251/training_args.bin +3 -0
- csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/tokenizer.json +3 -0
- csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/training_args.bin +3 -0
- csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/adapter_model.safetensors +3 -0
- csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/checkpoint-375/optimizer.pt +3 -0
- csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/checkpoint-375/rng_state_0.pth +3 -0
- csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/checkpoint-375/rng_state_1.pth +3 -0
- csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/checkpoint-375/rng_state_2.pth +3 -0
- csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/checkpoint-375/rng_state_3.pth +3 -0
- csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/checkpoint-375/scheduler.pt +3 -0
- csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/checkpoint-375/tokenizer.json +3 -0
- csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/checkpoint-375/training_args.bin +3 -0
- csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/tokenizer.json +3 -0
- csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/training_args.bin +3 -0
- csqa__qwen3_8b__t1t2_s0_half_bare_ss/lora/sft/checkpoint-750/rng_state_0.pth +3 -0
- csqa__qwen3_8b__t1t2_s0_half_bare_ss/lora/sft/checkpoint-750/rng_state_1.pth +3 -0
- csqa__qwen3_8b__t1t2_s0_half_bare_ss/lora/sft/checkpoint-750/rng_state_2.pth +3 -0
- csqa__qwen3_8b__t1t2_s0_half_bare_ss/lora/sft/checkpoint-750/rng_state_3.pth +3 -0
- csqa__qwen3_8b__t1t2_s0_half_bare_ss/lora/sft/checkpoint-750/scheduler.pt +3 -0
- csqa__qwen3_8b__t1t2_s0_half_bare_ss/lora/sft/checkpoint-750/tokenizer.json +3 -0
- csqa__qwen3_8b__t1t2_s0_half_bare_ss/lora/sft/checkpoint-750/training_args.bin +3 -0
- csqa__qwen3_8b__t1t2_s0_half_bare_ss/lora/sft/tokenizer.json +3 -0
- csqa__qwen3_8b__t1t2_s0_half_bare_ss/lora/sft/training_args.bin +3 -0
- csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1083/optimizer.pt +3 -0
- csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1083/rng_state_0.pth +3 -0
- csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1083/rng_state_1.pth +3 -0
- csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1083/rng_state_2.pth +3 -0
- csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1083/rng_state_3.pth +3 -0
- csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1083/scheduler.pt +3 -0
- csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1083/tokenizer.json +3 -0
- csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1083/training_args.bin +3 -0
- csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/tokenizer.json +3 -0
- csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/training_args.bin +3 -0
- csqa__qwen3_8b__t1t2_s1_80_20_bare_100/lora/sft/checkpoint-375/rng_state_2.pth +3 -0
- csqa__qwen3_8b__t1t2_s1_80_20_bare_100/lora/sft/checkpoint-375/scheduler.pt +3 -0
- csqa__qwen3_8b__t1t2_s1_80_20_bare_100/lora/sft/checkpoint-375/tokenizer.json +3 -0
- csqa__qwen3_8b__t1t2_s1_80_20_bare_100/lora/sft/checkpoint-375/training_args.bin +3 -0
- csqa__qwen3_8b__t1t2_s1_80_20_bare_100/lora/sft/tokenizer.json +3 -0
.gitattributes
CHANGED
|
@@ -37,3 +37,17 @@ csqa__llama3_8b_instruct__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1251/to
|
|
| 37 |
gsm8k__llama3_8b_instruct__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1251/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 38 |
gsm8k__llama3_8b_instruct__t1t2_s1_80_20_all_variants/lora/sft/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 39 |
csqa__llama3_8b_instruct__t1t2_s1_80_20_all_variants/lora/sft/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 37 |
gsm8k__llama3_8b_instruct__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1251/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 38 |
gsm8k__llama3_8b_instruct__t1t2_s1_80_20_all_variants/lora/sft/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 39 |
csqa__llama3_8b_instruct__t1t2_s1_80_20_all_variants/lora/sft/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
csqa__qwen3_8b__t1t2_s0_half_bare_ss/lora/sft/checkpoint-750/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
gsm8k__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1251/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
csqa__qwen3_8b__t1t2_s1_80_20_half_bare_ss/lora/sft/checkpoint-723/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
gsm8k__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
csqa__qwen3_8b__t1t2_s0_half_bare_ss/lora/sft/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/checkpoint-1251/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
csqa__qwen3_8b__t1t2_s1_80_20_bare_100/lora/sft/checkpoint-375/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
csqa__qwen3_8b__t1t2_s1_80_20_bare_100/lora/sft/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
csqa__qwen3_8b__t1t2_s1_80_20_half_bare_ss/lora/sft/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/checkpoint-375/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1083/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
csqa__llama3_8b_instruct__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1251/rng_state_2.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:84cf36eb77e76f4d60fcc92f3755828769fe8aab6a2ca29f9573827e93d0c9f5
|
| 3 |
+
size 15429
|
csqa__llama3_8b_instruct__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1251/rng_state_3.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e5001f16e2075ef4f6a1c0dbc75d9121e1906a36d5ad35279fed02e36a6c7d13
|
| 3 |
+
size 15429
|
csqa__llama3_8b_instruct__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1251/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe81d2a38e1b3446b2df91d7799fbc8c80087f959e47b7cab7b5bb0fc6db3501
|
| 3 |
+
size 6161
|
csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/checkpoint-1251/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7652a39324b207397ee4d922416f3094a71e5e1104edd9d6726812cd32caab9e
|
| 3 |
+
size 87360584
|
csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/checkpoint-1251/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ece94509f4d6054083bf10e31bcb99b0f2d8deccf094dd8f4dba7638bd4f190e
|
| 3 |
+
size 175012683
|
csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/checkpoint-1251/rng_state_0.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9eee49a2ad561e75c5f0f3e8056308fc27088e19e19620813602767a759d8e5a
|
| 3 |
+
size 15429
|
csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/checkpoint-1251/rng_state_1.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e34c5da13614815d740bb91790974fffad60cd4e1e61540d824668f639ceb8c4
|
| 3 |
+
size 15429
|
csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/checkpoint-1251/rng_state_2.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:84cf36eb77e76f4d60fcc92f3755828769fe8aab6a2ca29f9573827e93d0c9f5
|
| 3 |
+
size 15429
|
csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/checkpoint-1251/rng_state_3.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e5001f16e2075ef4f6a1c0dbc75d9121e1906a36d5ad35279fed02e36a6c7d13
|
| 3 |
+
size 15429
|
csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/checkpoint-1251/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:734ee5c970cbb54b0278472ea265d91b0b55d7c50d7efaf4e23a0d3f44c70a5a
|
| 3 |
+
size 1465
|
csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/checkpoint-1251/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|
csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/checkpoint-1251/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:68ddf7de1570616bffc40d1c9cd3c31fc35afbc4f528db4dd991d2993b4791e2
|
| 3 |
+
size 6161
|
csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|
csqa__qwen3_8b__t1t2_s0_all_variants/lora/sft/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:68ddf7de1570616bffc40d1c9cd3c31fc35afbc4f528db4dd991d2993b4791e2
|
| 3 |
+
size 6161
|
csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c58121393e57fbee812e322e74ce32e441d66f9166c1b0f3317324aa98a018c8
|
| 3 |
+
size 87360584
|
csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/checkpoint-375/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2969dff06dd2da81a95404ae898053762828d30716ff13fe5e5a4a2fe2b6ccbb
|
| 3 |
+
size 175012683
|
csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/checkpoint-375/rng_state_0.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9eee49a2ad561e75c5f0f3e8056308fc27088e19e19620813602767a759d8e5a
|
| 3 |
+
size 15429
|
csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/checkpoint-375/rng_state_1.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e34c5da13614815d740bb91790974fffad60cd4e1e61540d824668f639ceb8c4
|
| 3 |
+
size 15429
|
csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/checkpoint-375/rng_state_2.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:84cf36eb77e76f4d60fcc92f3755828769fe8aab6a2ca29f9573827e93d0c9f5
|
| 3 |
+
size 15429
|
csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/checkpoint-375/rng_state_3.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e5001f16e2075ef4f6a1c0dbc75d9121e1906a36d5ad35279fed02e36a6c7d13
|
| 3 |
+
size 15429
|
csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/checkpoint-375/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:88e2f19d069dccc536b4cbc782e2bea5ee08d71cb26d4844b07c19bfbd75a06f
|
| 3 |
+
size 1465
|
csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/checkpoint-375/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|
csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/checkpoint-375/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:14ce3c8facf8f09c4de7672ebf68dae1f8eaf431df5531e5c8b5ff39b8b21001
|
| 3 |
+
size 6161
|
csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|
csqa__qwen3_8b__t1t2_s0_bare_100/lora/sft/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:14ce3c8facf8f09c4de7672ebf68dae1f8eaf431df5531e5c8b5ff39b8b21001
|
| 3 |
+
size 6161
|
csqa__qwen3_8b__t1t2_s0_half_bare_ss/lora/sft/checkpoint-750/rng_state_0.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9eee49a2ad561e75c5f0f3e8056308fc27088e19e19620813602767a759d8e5a
|
| 3 |
+
size 15429
|
csqa__qwen3_8b__t1t2_s0_half_bare_ss/lora/sft/checkpoint-750/rng_state_1.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e34c5da13614815d740bb91790974fffad60cd4e1e61540d824668f639ceb8c4
|
| 3 |
+
size 15429
|
csqa__qwen3_8b__t1t2_s0_half_bare_ss/lora/sft/checkpoint-750/rng_state_2.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:84cf36eb77e76f4d60fcc92f3755828769fe8aab6a2ca29f9573827e93d0c9f5
|
| 3 |
+
size 15429
|
csqa__qwen3_8b__t1t2_s0_half_bare_ss/lora/sft/checkpoint-750/rng_state_3.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e5001f16e2075ef4f6a1c0dbc75d9121e1906a36d5ad35279fed02e36a6c7d13
|
| 3 |
+
size 15429
|
csqa__qwen3_8b__t1t2_s0_half_bare_ss/lora/sft/checkpoint-750/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:50d264908855be7b75ed889f9dde1345bcdb0afa3b2d8ead87139ea4577267cf
|
| 3 |
+
size 1465
|
csqa__qwen3_8b__t1t2_s0_half_bare_ss/lora/sft/checkpoint-750/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|
csqa__qwen3_8b__t1t2_s0_half_bare_ss/lora/sft/checkpoint-750/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ce0e9ff323cf334dbb374cfdd9be99c4e74f1d84b9f80691f1d9a376abe9ee1
|
| 3 |
+
size 6161
|
csqa__qwen3_8b__t1t2_s0_half_bare_ss/lora/sft/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|
csqa__qwen3_8b__t1t2_s0_half_bare_ss/lora/sft/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ce0e9ff323cf334dbb374cfdd9be99c4e74f1d84b9f80691f1d9a376abe9ee1
|
| 3 |
+
size 6161
|
csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1083/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:582bde9d8ffdaf8ade37a91aefcb49789b72af183db769f35ec2d7c6efd030e6
|
| 3 |
+
size 175012683
|
csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1083/rng_state_0.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9eee49a2ad561e75c5f0f3e8056308fc27088e19e19620813602767a759d8e5a
|
| 3 |
+
size 15429
|
csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1083/rng_state_1.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e34c5da13614815d740bb91790974fffad60cd4e1e61540d824668f639ceb8c4
|
| 3 |
+
size 15429
|
csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1083/rng_state_2.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:84cf36eb77e76f4d60fcc92f3755828769fe8aab6a2ca29f9573827e93d0c9f5
|
| 3 |
+
size 15429
|
csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1083/rng_state_3.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e5001f16e2075ef4f6a1c0dbc75d9121e1906a36d5ad35279fed02e36a6c7d13
|
| 3 |
+
size 15429
|
csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1083/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:04b5fc03714e867d91def6c1cfc52245fcf84d5b1ed53382766793296d3f2a14
|
| 3 |
+
size 1465
|
csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1083/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|
csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/checkpoint-1083/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e5911790eebe84ff8b794c2c50e9ee062d8df5a9a173e7e20817879e2a1c74d8
|
| 3 |
+
size 6161
|
csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|
csqa__qwen3_8b__t1t2_s1_80_20_all_variants/lora/sft/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e5911790eebe84ff8b794c2c50e9ee062d8df5a9a173e7e20817879e2a1c74d8
|
| 3 |
+
size 6161
|
csqa__qwen3_8b__t1t2_s1_80_20_bare_100/lora/sft/checkpoint-375/rng_state_2.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:84cf36eb77e76f4d60fcc92f3755828769fe8aab6a2ca29f9573827e93d0c9f5
|
| 3 |
+
size 15429
|
csqa__qwen3_8b__t1t2_s1_80_20_bare_100/lora/sft/checkpoint-375/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:88e2f19d069dccc536b4cbc782e2bea5ee08d71cb26d4844b07c19bfbd75a06f
|
| 3 |
+
size 1465
|
csqa__qwen3_8b__t1t2_s1_80_20_bare_100/lora/sft/checkpoint-375/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|
csqa__qwen3_8b__t1t2_s1_80_20_bare_100/lora/sft/checkpoint-375/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5684aa4750d240de4dab90afe99030ce927aab815505eb8b149034a160d51f92
|
| 3 |
+
size 6161
|
csqa__qwen3_8b__t1t2_s1_80_20_bare_100/lora/sft/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|