Add files using upload-large-folder tool
Browse files- .gitattributes +10 -0
- eval_results_ood/global_step_80/details/_home_work_compass_innovation_minzijun_checkpoints_verl_role_sft_grpo_deepmath_train_sample_6144_context_4k_Qwen3-1.7B-base_max_response4096_batch1024_rollout8_vllm_True_bias1.5_global_step_80_actor_huggingface/2025-08-20T21-48-46.935565/details_extended|ifeval|0_2025-08-20T21-48-46.935565.parquet +3 -0
- eval_results_ood/global_step_90/details/_home_work_compass_innovation_minzijun_checkpoints_verl_role_sft_grpo_deepmath_train_sample_6144_context_4k_Qwen3-1.7B-base_max_response4096_batch1024_rollout8_vllm_True_bias1.5_global_step_90_actor_huggingface/2025-08-20T18-03-43.749603/details_extended|ifeval|0_2025-08-20T18-03-43.749603.parquet +3 -0
- eval_results_ood/global_step_90/details/_home_work_compass_innovation_minzijun_checkpoints_verl_role_sft_grpo_deepmath_train_sample_6144_context_4k_Qwen3-1.7B-base_max_response4096_batch1024_rollout8_vllm_True_bias1.5_global_step_90_actor_huggingface/2025-08-20T18-03-43.749603/details_lighteval|gpqa:diamond|0_2025-08-20T18-03-43.749603.parquet +3 -0
- eval_results_ood/global_step_90/details/_home_work_compass_innovation_minzijun_checkpoints_verl_role_sft_grpo_deepmath_train_sample_6144_context_4k_Qwen3-1.7B-base_max_response4096_batch1024_rollout8_vllm_True_bias1.5_global_step_90_actor_huggingface/2025-08-20T20-28-04.073795/details_extended|ifeval|0_2025-08-20T20-28-04.073795.parquet +3 -0
- eval_results_ood/global_step_90/details/_home_work_compass_innovation_minzijun_checkpoints_verl_role_sft_grpo_deepmath_train_sample_6144_context_4k_Qwen3-1.7B-base_max_response4096_batch1024_rollout8_vllm_True_bias1.5_global_step_90_actor_huggingface/2025-08-20T20-28-04.073795/details_lighteval|gpqa:diamond|0_2025-08-20T20-28-04.073795.parquet +3 -0
- eval_results_ood/global_step_90/details/_home_work_compass_innovation_minzijun_checkpoints_verl_role_sft_grpo_deepmath_train_sample_6144_context_4k_Qwen3-1.7B-base_max_response4096_batch1024_rollout8_vllm_True_bias1.5_global_step_90_actor_huggingface/2025-08-20T21-43-47.552890/details_extended|ifeval|0_2025-08-20T21-43-47.552890.parquet +3 -0
- eval_results_ood/global_step_90/details/_home_work_compass_innovation_minzijun_checkpoints_verl_role_sft_grpo_deepmath_train_sample_6144_context_4k_Qwen3-1.7B-base_max_response4096_batch1024_rollout8_vllm_True_bias1.5_global_step_90_actor_huggingface/2025-08-20T21-43-47.552890/details_lighteval|gpqa:diamond|0_2025-08-20T21-43-47.552890.parquet +3 -0
- global_step_10/actor/huggingface/model.safetensors +3 -0
- global_step_10/actor/huggingface/tokenizer.json +3 -0
- global_step_10/data.pt +3 -0
- global_step_100/actor/huggingface/tokenizer.json +3 -0
- global_step_100/data.pt +3 -0
- global_step_20/actor/huggingface/tokenizer.json +3 -0
- global_step_20/data.pt +3 -0
- global_step_30/actor/huggingface/tokenizer.json +3 -0
- global_step_30/data.pt +3 -0
- global_step_40/actor/huggingface/tokenizer.json +3 -0
- global_step_40/data.pt +3 -0
- global_step_50/actor/huggingface/tokenizer.json +3 -0
- global_step_50/data.pt +3 -0
- global_step_60/actor/huggingface/tokenizer.json +3 -0
- global_step_60/data.pt +3 -0
- global_step_70/actor/huggingface/tokenizer.json +3 -0
- global_step_70/data.pt +3 -0
- global_step_80/actor/huggingface/tokenizer.json +3 -0
- global_step_80/data.pt +3 -0
- global_step_90/actor/huggingface/tokenizer.json +3 -0
- global_step_90/data.pt +3 -0
.gitattributes
CHANGED
|
@@ -62,3 +62,13 @@ eval_results_ood/global_step_10/details/_home_work_compass_innovation_minzijun_c
|
|
| 62 |
eval_results_ood/global_step_0/details/_home_work_compass_innovation_minzijun_checkpoints_verl_role_sft_grpo_deepmath_train_sample_6144_context_4k_Qwen3-1.7B-base_max_response4096_batch1024_rollout8_vllm_True_bias1.5_global_step_0_actor_huggingface/2025-08-20T21-36-38.816189/details_extended|ifeval|0_2025-08-20T21-36-38.816189.csv filter=lfs diff=lfs merge=lfs -text
|
| 63 |
eval_results_ood/global_step_10/details/_home_work_compass_innovation_minzijun_checkpoints_verl_role_sft_grpo_deepmath_train_sample_6144_context_4k_Qwen3-1.7B-base_max_response4096_batch1024_rollout8_vllm_True_bias1.5_global_step_10_actor_huggingface/2025-08-20T20-20-53.516588/details_extended|ifeval|0_2025-08-20T20-20-53.516588.csv filter=lfs diff=lfs merge=lfs -text
|
| 64 |
eval_results_ood/global_step_10/details/_home_work_compass_innovation_minzijun_checkpoints_verl_role_sft_grpo_deepmath_train_sample_6144_context_4k_Qwen3-1.7B-base_max_response4096_batch1024_rollout8_vllm_True_bias1.5_global_step_10_actor_huggingface/2025-08-20T21-30-26.010784/details_extended|ifeval|0_2025-08-20T21-30-26.010784.csv filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 62 |
eval_results_ood/global_step_0/details/_home_work_compass_innovation_minzijun_checkpoints_verl_role_sft_grpo_deepmath_train_sample_6144_context_4k_Qwen3-1.7B-base_max_response4096_batch1024_rollout8_vllm_True_bias1.5_global_step_0_actor_huggingface/2025-08-20T21-36-38.816189/details_extended|ifeval|0_2025-08-20T21-36-38.816189.csv filter=lfs diff=lfs merge=lfs -text
|
| 63 |
eval_results_ood/global_step_10/details/_home_work_compass_innovation_minzijun_checkpoints_verl_role_sft_grpo_deepmath_train_sample_6144_context_4k_Qwen3-1.7B-base_max_response4096_batch1024_rollout8_vllm_True_bias1.5_global_step_10_actor_huggingface/2025-08-20T20-20-53.516588/details_extended|ifeval|0_2025-08-20T20-20-53.516588.csv filter=lfs diff=lfs merge=lfs -text
|
| 64 |
eval_results_ood/global_step_10/details/_home_work_compass_innovation_minzijun_checkpoints_verl_role_sft_grpo_deepmath_train_sample_6144_context_4k_Qwen3-1.7B-base_max_response4096_batch1024_rollout8_vllm_True_bias1.5_global_step_10_actor_huggingface/2025-08-20T21-30-26.010784/details_extended|ifeval|0_2025-08-20T21-30-26.010784.csv filter=lfs diff=lfs merge=lfs -text
|
| 65 |
+
global_step_10/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 66 |
+
global_step_100/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 67 |
+
global_step_20/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 68 |
+
global_step_30/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 69 |
+
global_step_40/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 70 |
+
global_step_50/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 71 |
+
global_step_60/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 72 |
+
global_step_70/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 73 |
+
global_step_80/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 74 |
+
global_step_90/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
eval_results_ood/global_step_80/details/_home_work_compass_innovation_minzijun_checkpoints_verl_role_sft_grpo_deepmath_train_sample_6144_context_4k_Qwen3-1.7B-base_max_response4096_batch1024_rollout8_vllm_True_bias1.5_global_step_80_actor_huggingface/2025-08-20T21-48-46.935565/details_extended|ifeval|0_2025-08-20T21-48-46.935565.parquet
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9c2203ee878c41394f24d9515efd9c5b6d07284195ce9006c27c55bdbe318145
|
| 3 |
+
size 1286597
|
eval_results_ood/global_step_90/details/_home_work_compass_innovation_minzijun_checkpoints_verl_role_sft_grpo_deepmath_train_sample_6144_context_4k_Qwen3-1.7B-base_max_response4096_batch1024_rollout8_vllm_True_bias1.5_global_step_90_actor_huggingface/2025-08-20T18-03-43.749603/details_extended|ifeval|0_2025-08-20T18-03-43.749603.parquet
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fb715b76416500380f7fa14665c44dfbaf722122420565724c1e78439cc101b9
|
| 3 |
+
size 1287943
|
eval_results_ood/global_step_90/details/_home_work_compass_innovation_minzijun_checkpoints_verl_role_sft_grpo_deepmath_train_sample_6144_context_4k_Qwen3-1.7B-base_max_response4096_batch1024_rollout8_vllm_True_bias1.5_global_step_90_actor_huggingface/2025-08-20T18-03-43.749603/details_lighteval|gpqa:diamond|0_2025-08-20T18-03-43.749603.parquet
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:31cba75e84dcba95cf3200c4a92e5a311a5919183e86fd926b9f103bdaedf995
|
| 3 |
+
size 740664
|
eval_results_ood/global_step_90/details/_home_work_compass_innovation_minzijun_checkpoints_verl_role_sft_grpo_deepmath_train_sample_6144_context_4k_Qwen3-1.7B-base_max_response4096_batch1024_rollout8_vllm_True_bias1.5_global_step_90_actor_huggingface/2025-08-20T20-28-04.073795/details_extended|ifeval|0_2025-08-20T20-28-04.073795.parquet
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86576718eaf5298ced10f680d659e147ee28fd2ec0bab2f6dc6d0c442a0a609c
|
| 3 |
+
size 1230970
|
eval_results_ood/global_step_90/details/_home_work_compass_innovation_minzijun_checkpoints_verl_role_sft_grpo_deepmath_train_sample_6144_context_4k_Qwen3-1.7B-base_max_response4096_batch1024_rollout8_vllm_True_bias1.5_global_step_90_actor_huggingface/2025-08-20T20-28-04.073795/details_lighteval|gpqa:diamond|0_2025-08-20T20-28-04.073795.parquet
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f161a40db9f0f113736301987f6e7c131e7a88aaded9654a75749f9def9d9e86
|
| 3 |
+
size 711359
|
eval_results_ood/global_step_90/details/_home_work_compass_innovation_minzijun_checkpoints_verl_role_sft_grpo_deepmath_train_sample_6144_context_4k_Qwen3-1.7B-base_max_response4096_batch1024_rollout8_vllm_True_bias1.5_global_step_90_actor_huggingface/2025-08-20T21-43-47.552890/details_extended|ifeval|0_2025-08-20T21-43-47.552890.parquet
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:da60cba5dce1305d35e892f29faeb7fd0596825d51c6717b6d721de79706fb64
|
| 3 |
+
size 1230970
|
eval_results_ood/global_step_90/details/_home_work_compass_innovation_minzijun_checkpoints_verl_role_sft_grpo_deepmath_train_sample_6144_context_4k_Qwen3-1.7B-base_max_response4096_batch1024_rollout8_vllm_True_bias1.5_global_step_90_actor_huggingface/2025-08-20T21-43-47.552890/details_lighteval|gpqa:diamond|0_2025-08-20T21-43-47.552890.parquet
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f161a40db9f0f113736301987f6e7c131e7a88aaded9654a75749f9def9d9e86
|
| 3 |
+
size 711359
|
global_step_10/actor/huggingface/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6f9131f8ee80a57cb7c3db3a77f2be329eb04c6baa95094a17cd51c6753d09bb
|
| 3 |
+
size 4063515640
|
global_step_10/actor/huggingface/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|
global_step_10/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aae9cac0f48798a4167cb59dc3be01018f3b002fa92413d0d684d6aab802248c
|
| 3 |
+
size 1947
|
global_step_100/actor/huggingface/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|
global_step_100/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dc54cc54a2ae27bcb749f03791d68574003beaeac89e301216cd08481afb0166
|
| 3 |
+
size 1947
|
global_step_20/actor/huggingface/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|
global_step_20/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fec3eef973f024013ff9e53830cf1ec34af7e525911b64ab819235c7976f7d0d
|
| 3 |
+
size 1947
|
global_step_30/actor/huggingface/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|
global_step_30/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e24cf7e13052deb8f18db6c09cb86b369fe04864ae21ed87dc42829ad10a9e5a
|
| 3 |
+
size 1947
|
global_step_40/actor/huggingface/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|
global_step_40/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:37f844bd43d239b679f610c60d464ce1d2f071bb27f66867de02d17db6a772ba
|
| 3 |
+
size 1947
|
global_step_50/actor/huggingface/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|
global_step_50/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:93a9191ddeece333cb9640bc2f326b62e3eee0e127c70deca1ea6cce70e81fff
|
| 3 |
+
size 1947
|
global_step_60/actor/huggingface/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|
global_step_60/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:efbbb2217cd9d765107abc2e5227e1243b259be52cc2d672b7b30676a24b23c6
|
| 3 |
+
size 1947
|
global_step_70/actor/huggingface/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|
global_step_70/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f87b7d97b67ae821087ff43fb7fbebd7fce80d386b85214b53949b5f6bfa1ece
|
| 3 |
+
size 1947
|
global_step_80/actor/huggingface/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|
global_step_80/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:50640094f4ad1fd03a7afc9526e3a0c5d87c34d5e9c227c66bda96072c84df70
|
| 3 |
+
size 1947
|
global_step_90/actor/huggingface/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
|
| 3 |
+
size 11422654
|
global_step_90/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e950e65d778d1d88512086d9d16dab084a2da6c68cc2f1a55963580303f2b00e
|
| 3 |
+
size 1947
|