Upload folder using huggingface_hub
Browse files- planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/extra_state_world_size_4_rank_0.pt +1 -1
- planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/extra_state_world_size_4_rank_1.pt +1 -1
- planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/extra_state_world_size_4_rank_2.pt +1 -1
- planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/extra_state_world_size_4_rank_3.pt +1 -1
- planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/model_world_size_4_rank_0.pt +1 -1
- planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/model_world_size_4_rank_1.pt +1 -1
- planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/model_world_size_4_rank_2.pt +1 -1
- planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/model_world_size_4_rank_3.pt +1 -1
- planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/optim_world_size_4_rank_0.pt +1 -1
- planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/optim_world_size_4_rank_1.pt +1 -1
- planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/optim_world_size_4_rank_2.pt +1 -1
- planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/optim_world_size_4_rank_3.pt +1 -1
- planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/data.pt +1 -1
planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/extra_state_world_size_4_rank_0.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15077
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:766a1cebb346f9c9433166fef12b6868a22e629b80c588eb4187c34acada72dc
|
| 3 |
size 15077
|
planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/extra_state_world_size_4_rank_1.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15077
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:48b5c7b90ce0f4a509dfc562300603255eeef992804cc0d4475b3cf433b88273
|
| 3 |
size 15077
|
planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/extra_state_world_size_4_rank_2.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15077
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f194f73b1d29812dad2b4c402899e3f82dcf27ddbed830184db0741b4cf5cf4f
|
| 3 |
size 15077
|
planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/extra_state_world_size_4_rank_3.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15077
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2e1b9969d25b8a5896e23f86fd28b29293983366563f34c1f4baa68eb24bd27f
|
| 3 |
size 15077
|
planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/model_world_size_4_rank_0.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 7615805455
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f0969622371d9abc9af9ff23ddb6d050eec33cadad92d15e3fd9970189a67ad4
|
| 3 |
size 7615805455
|
planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/model_world_size_4_rank_1.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 7615805455
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:991cda288e435425ecdd98af8f626bbc9a5c4d1d4ecfbbc0d33b0cde867fec83
|
| 3 |
size 7615805455
|
planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/model_world_size_4_rank_2.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 7615805455
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6866a8e3d47633ec7975cbf13286a2926b74757c99e4aa6c89b0dbf832fe47e8
|
| 3 |
size 7615805455
|
planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/model_world_size_4_rank_3.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 7615805455
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:75cf2648c2f5e2d8348ea9ae970714ff986e60fc1b09a90987f4683e47ad940f
|
| 3 |
size 7615805455
|
planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/optim_world_size_4_rank_0.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15231259716
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86ed083fc300760f72d29cf473b077ccae557d145e6d803cfb2ed1719066b2b0
|
| 3 |
size 15231259716
|
planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/optim_world_size_4_rank_1.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15231259716
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f55c6ce5edd7253a68c56f212b8d346fe95c471c221cf4bb2aa354518415d19a
|
| 3 |
size 15231259716
|
planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/optim_world_size_4_rank_2.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15231259716
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ffffa68ba6cadff1a8e575ac8289f23fd8545edd8af3af0fbf3051ad427cc349
|
| 3 |
size 15231259716
|
planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/actor/optim_world_size_4_rank_3.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15231259716
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f837483661a6a0d9f7ff5726f408acf4187d1218d5ac77813e75b4f9631115e3
|
| 3 |
size 15231259716
|
planning_2509_DeepSeek-R1-Distill-Qwen-7B_grpo/data.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1947
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c296fb8b9a8d13076408bcc47ac54057b7604c18abe105123f604d98b6bed08c
|
| 3 |
size 1947
|