Add files using upload-large-folder tool
Browse files- .gitattributes +20 -0
- eval_results/global_step_100/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl +3 -0
- eval_results/global_step_110/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl +3 -0
- eval_results/global_step_120/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl +3 -0
- eval_results/global_step_30/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl +3 -0
- eval_results/global_step_40/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl +3 -0
- eval_results/global_step_50/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl +3 -0
- eval_results/global_step_60/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl +3 -0
- eval_results/global_step_70/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl +3 -0
- eval_results/global_step_90/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl +3 -0
- eval_results/plots/eval_results_acc_keywords.png +3 -0
- eval_results/plots/eval_results_acc_pass_acc.png +3 -0
- eval_results/plots/eval_results_acc_tokens.png +3 -0
- eval_results/plots/eval_results_avg_stop_tokens.png +3 -0
- eval_results/plots/eval_results_box_ratio_and_token_length.png +3 -0
- eval_results/plots/eval_results_clip_ratio.png +3 -0
- eval_results/plots/eval_results_correct_tokens.png +3 -0
- eval_results/plots/eval_results_repeat_ratio_and_token_length.png +3 -0
- eval_results/plots/eval_results_tokens_keywords.png +3 -0
- eval_results/plots/eval_results_wrong_tokens.png +3 -0
- eval_results_ood/global_step_120/details/_home_work_minzijun_rl_output_checkpoints_verl_0.4_grpo_simplelr_math_35_train_Qwen3-8B-base_max_response4096_batch1024_rollout8_vllm_global_step_120_actor_huggingface/2025-07-14T13-13-03.024786/details_lighteval|gpqa:diamond|0_2025-07-14T13-13-03.024786.parquet +3 -0
- eval_results_ood/global_step_120/details/_home_work_minzijun_rl_output_checkpoints_verl_0.4_grpo_simplelr_math_35_train_Qwen3-8B-base_max_response4096_batch1024_rollout8_vllm_global_step_120_actor_huggingface/2025-07-17T16-25-43.731519/details_extended|ifeval|0_2025-07-17T16-25-43.731519.parquet +3 -0
- eval_results_ood/global_step_80/details/_home_work_minzijun_rl_output_checkpoints_verl_0.4_grpo_simplelr_math_35_train_Qwen3-8B-base_max_response4096_batch1024_rollout8_vllm_global_step_80_actor_huggingface/2025-07-14T12-59-00.847335/details_lighteval|gpqa:diamond|0_2025-07-14T12-59-00.847335.parquet +3 -0
- eval_results_ood/global_step_80/details/_home_work_minzijun_rl_output_checkpoints_verl_0.4_grpo_simplelr_math_35_train_Qwen3-8B-base_max_response4096_batch1024_rollout8_vllm_global_step_80_actor_huggingface/2025-07-17T15-55-01.078366/details_extended|ifeval|0_2025-07-17T15-55-01.078366.parquet +3 -0
- global_step_20/actor/huggingface/model-00001-of-00004.safetensors +3 -0
- global_step_30/actor/huggingface/model-00001-of-00004.safetensors +3 -0
- global_step_30/actor/huggingface/model-00002-of-00004.safetensors +3 -0
- global_step_30/actor/huggingface/model-00003-of-00004.safetensors +3 -0
- global_step_40/actor/huggingface/model-00004-of-00004.safetensors +3 -0
- global_step_50/actor/huggingface/tokenizer.json +3 -0
- global_step_50/data.pt +3 -0
.gitattributes
CHANGED
|
@@ -82,3 +82,23 @@ eval_results_avg32/global_step_80/aime24/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.js
|
|
| 82 |
eval_results_avg32/global_step_80/aime25/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 83 |
global_step_100/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 84 |
global_step_40/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 82 |
eval_results_avg32/global_step_80/aime25/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 83 |
global_step_100/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 84 |
global_step_40/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 85 |
+
global_step_50/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 86 |
+
eval_results/global_step_60/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 87 |
+
eval_results/global_step_70/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 88 |
+
eval_results/global_step_90/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 89 |
+
eval_results/global_step_30/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 90 |
+
eval_results/global_step_100/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 91 |
+
eval_results/global_step_40/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 92 |
+
eval_results/plots/eval_results_box_ratio_and_token_length.png filter=lfs diff=lfs merge=lfs -text
|
| 93 |
+
eval_results/plots/eval_results_tokens_keywords.png filter=lfs diff=lfs merge=lfs -text
|
| 94 |
+
eval_results/plots/eval_results_clip_ratio.png filter=lfs diff=lfs merge=lfs -text
|
| 95 |
+
eval_results/plots/eval_results_correct_tokens.png filter=lfs diff=lfs merge=lfs -text
|
| 96 |
+
eval_results/plots/eval_results_acc_pass_acc.png filter=lfs diff=lfs merge=lfs -text
|
| 97 |
+
eval_results/plots/eval_results_avg_stop_tokens.png filter=lfs diff=lfs merge=lfs -text
|
| 98 |
+
eval_results/plots/eval_results_acc_keywords.png filter=lfs diff=lfs merge=lfs -text
|
| 99 |
+
eval_results/plots/eval_results_wrong_tokens.png filter=lfs diff=lfs merge=lfs -text
|
| 100 |
+
eval_results/plots/eval_results_acc_tokens.png filter=lfs diff=lfs merge=lfs -text
|
| 101 |
+
eval_results/plots/eval_results_repeat_ratio_and_token_length.png filter=lfs diff=lfs merge=lfs -text
|
| 102 |
+
eval_results/global_step_50/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 103 |
+
eval_results/global_step_110/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 104 |
+
eval_results/global_step_120/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl filter=lfs diff=lfs merge=lfs -text
|
eval_results/global_step_100/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:221076d5127cd80a6c98e7b988ce29f042772cd816e3dfde1cf77f9e9a6b900e
|
| 3 |
+
size 11380521
|
eval_results/global_step_110/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca9e13d40282e342684aa1ccfe59bc2f3a80cc8a7f8aef4691076fe55d9bc73b
|
| 3 |
+
size 12648344
|
eval_results/global_step_120/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3dcbc96afbf4c6aa0c73a44218fcb014770f32922d57def1a1e3af19d3dc6005
|
| 3 |
+
size 11329116
|
eval_results/global_step_30/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8d7d4187910fb7b9dc3a68b107417347f2d5bfcb65e65487058e43b1c4c18ad9
|
| 3 |
+
size 10701349
|
eval_results/global_step_40/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b145a60b2979de04cdc9a796e1a3b2a6046c6fd2c76c601c30e70ee68e1b18ff
|
| 3 |
+
size 10965385
|
eval_results/global_step_50/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:751a8d7f5cc4e9599a52f6a7947cbaeba39e462c3b8ea4e0accccba7edc55ddf
|
| 3 |
+
size 12662531
|
eval_results/global_step_60/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4571fb6f9664b515083a012ca82b4fc9992542a69aaf19fd96993fa8b81f681d
|
| 3 |
+
size 11153588
|
eval_results/global_step_70/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fb7417e50f2114558a915a9b047977d4439d018a4a29e4a1f191c77df17f8cf5
|
| 3 |
+
size 12534459
|
eval_results/global_step_90/mmlu_stem/test_qwen-boxed_-1_seed0_t1.0_s0_e-1.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5425d2d755be207a95d16428d9cc030e08bfcd6f1d61d1f9f655f74e0670999b
|
| 3 |
+
size 12942646
|
eval_results/plots/eval_results_acc_keywords.png
ADDED
|
Git LFS Details
|
eval_results/plots/eval_results_acc_pass_acc.png
ADDED
|
Git LFS Details
|
eval_results/plots/eval_results_acc_tokens.png
ADDED
|
Git LFS Details
|
eval_results/plots/eval_results_avg_stop_tokens.png
ADDED
|
Git LFS Details
|
eval_results/plots/eval_results_box_ratio_and_token_length.png
ADDED
|
Git LFS Details
|
eval_results/plots/eval_results_clip_ratio.png
ADDED
|
Git LFS Details
|
eval_results/plots/eval_results_correct_tokens.png
ADDED
|
Git LFS Details
|
eval_results/plots/eval_results_repeat_ratio_and_token_length.png
ADDED
|
Git LFS Details
|
eval_results/plots/eval_results_tokens_keywords.png
ADDED
|
Git LFS Details
|
eval_results/plots/eval_results_wrong_tokens.png
ADDED
|
Git LFS Details
|
eval_results_ood/global_step_120/details/_home_work_minzijun_rl_output_checkpoints_verl_0.4_grpo_simplelr_math_35_train_Qwen3-8B-base_max_response4096_batch1024_rollout8_vllm_global_step_120_actor_huggingface/2025-07-14T13-13-03.024786/details_lighteval|gpqa:diamond|0_2025-07-14T13-13-03.024786.parquet
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5fccf91d4c512fdfa56d8a20e464559c477bd115f65e3346f4a2c63e74799f8a
|
| 3 |
+
size 785001
|
eval_results_ood/global_step_120/details/_home_work_minzijun_rl_output_checkpoints_verl_0.4_grpo_simplelr_math_35_train_Qwen3-8B-base_max_response4096_batch1024_rollout8_vllm_global_step_120_actor_huggingface/2025-07-17T16-25-43.731519/details_extended|ifeval|0_2025-07-17T16-25-43.731519.parquet
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2b855e79b91f1a7f2975e2de5502b22e3221eb2dbe94e61430b54f3cb5d74e19
|
| 3 |
+
size 2417316
|
eval_results_ood/global_step_80/details/_home_work_minzijun_rl_output_checkpoints_verl_0.4_grpo_simplelr_math_35_train_Qwen3-8B-base_max_response4096_batch1024_rollout8_vllm_global_step_80_actor_huggingface/2025-07-14T12-59-00.847335/details_lighteval|gpqa:diamond|0_2025-07-14T12-59-00.847335.parquet
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:27082504671739c31f71b9646764956e5809c2aa045eb2f46036c15ccaf6a36a
|
| 3 |
+
size 779776
|
eval_results_ood/global_step_80/details/_home_work_minzijun_rl_output_checkpoints_verl_0.4_grpo_simplelr_math_35_train_Qwen3-8B-base_max_response4096_batch1024_rollout8_vllm_global_step_80_actor_huggingface/2025-07-17T15-55-01.078366/details_extended|ifeval|0_2025-07-17T15-55-01.078366.parquet
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9ef8c2565150be7c6f1b29016892d7ee5fc72553c11122684ea7ecf3230e04af
|
| 3 |
+
size 2463492
|
global_step_20/actor/huggingface/model-00001-of-00004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b61bbecf1872267fefb65aa9536252ab1351a940c1ab69f601ad3f268934852d
|
| 3 |
+
size 4994574152
|
global_step_30/actor/huggingface/model-00001-of-00004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c1f87e4d6f5650f8afa65e950061886fe3515741599bc634f30dba8432b7cd5e
|
| 3 |
+
size 4373781280
|
global_step_30/actor/huggingface/model-00002-of-00004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1c2136e2f28a3f172c47ec3bb4abad6f5b37fa07292e7d5f7fa8d435990372ca
|
| 3 |
+
size 4961018016
|
global_step_30/actor/huggingface/model-00003-of-00004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:389b5ae626d75d1232c75a36b9ff83b9f79419b5d26bb7f65afb2252ac2c1729
|
| 3 |
+
size 4915893984
|
global_step_40/actor/huggingface/model-00004-of-00004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:69cb062e4a365442a94d7d85a95dd14d6d8e4bd2b6b5a0c80f2ed6e462c07ef9
|
| 3 |
+
size 1535160824
|
global_step_50/actor/huggingface/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|
global_step_50/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:93e68dbf80a5a3268306af9e8b54ddf98e6280df8622143714b893455961b820
|
| 3 |
+
size 1492
|