Add files using upload-large-folder tool
Browse files- Llama-3.2-3B-Instruct-polaris-GRPO--bsz128/global_step_128/actor_hf/model-00001-of-00002.safetensors +3 -0
- Llama-3.2-3B-Instruct-polaris-GRPO--bsz128/global_step_256/actor_hf/model-00001-of-00002.safetensors +3 -0
- Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_192/actor_hf/model-00001-of-00002.safetensors +3 -0
- Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_384/actor_hf/model-00001-of-00002.safetensors +3 -0
- Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_512/actor_hf/model-00001-of-00002.safetensors +3 -0
- Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_64/actor_hf/model-00001-of-00002.safetensors +3 -0
- Llama-3.2-3B-Instruct-polaris-GRPO--bsz256/global_step_192/actor_hf/model-00001-of-00002.safetensors +3 -0
- Llama-3.2-3B-Instruct-polaris-GRPO--bsz256/global_step_256/actor_hf/model-00001-of-00002.safetensors +3 -0
- Llama-3.2-3B-Instruct-polaris-GRPO--bsz256/global_step_384/actor_hf/model-00001-of-00002.safetensors +3 -0
- Llama-3.2-3B-Instruct-polaris-GRPO--bsz32/global_step_384/actor_hf/model-00001-of-00002.safetensors +3 -0
- Llama-3.2-3B-Instruct-polaris-GRPO--bsz32/global_step_512/actor_hf/model-00001-of-00002.safetensors +3 -0
- Llama-3.2-3B-Instruct-polaris-GRPO--bsz32/global_step_64/actor_hf/model-00001-of-00002.safetensors +3 -0
- Llama-3.2-3B-Instruct-polaris-GRPO--bsz512/global_step_320/actor_hf/model-00001-of-00002.safetensors +3 -0
- Llama-3.2-3B-Instruct-polaris-GRPO--bsz512/global_step_64/actor_hf/model-00001-of-00002.safetensors +3 -0
- Llama-3.2-3B-Instruct-polaris-GRPO--bsz64/global_step_384/actor_hf/model-00001-of-00002.safetensors +3 -0
Llama-3.2-3B-Instruct-polaris-GRPO--bsz128/global_step_128/actor_hf/model-00001-of-00002.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f195fe1da778c32c2451fd488d4fa1b2df71e41b6c2cfd49fb6774c01c837ae5
|
| 3 |
+
size 4973610584
|
Llama-3.2-3B-Instruct-polaris-GRPO--bsz128/global_step_256/actor_hf/model-00001-of-00002.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:838aa332345304574b0ab7329f32f966a3d8eb90ae5222ad98be9e448d037323
|
| 3 |
+
size 4821120184
|
Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_192/actor_hf/model-00001-of-00002.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ffa4da8162c7218467b08d2f825cdfe14363670c163f61ed3853f755706711ca
|
| 3 |
+
size 4984680248
|
Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_384/actor_hf/model-00001-of-00002.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:736f356d7cb6fcd36adba376ec8d8628aabe702018ef5f7c0451f776be51c442
|
| 3 |
+
size 4731468832
|
Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_512/actor_hf/model-00001-of-00002.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1d79a266c6e97e6d3295eb1a8b3b32d7523be0079135448a51bfaf3a8e70d4bc
|
| 3 |
+
size 4959520672
|
Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_64/actor_hf/model-00001-of-00002.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c8ea4a034b460f21bfa6c70e251b429e204140b77594e6c95a299a70b6456ad4
|
| 3 |
+
size 4953222576
|
Llama-3.2-3B-Instruct-polaris-GRPO--bsz256/global_step_192/actor_hf/model-00001-of-00002.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a2ca4b12066f1390818e993275b1211a7d94f673359d255fae6fb5a21f2d3ee9
|
| 3 |
+
size 4978375752
|
Llama-3.2-3B-Instruct-polaris-GRPO--bsz256/global_step_256/actor_hf/model-00001-of-00002.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86c33778a9e2f27d38010b9c0807952865573d26264670f2600ebc8d82edbc7d
|
| 3 |
+
size 4967330816
|
Llama-3.2-3B-Instruct-polaris-GRPO--bsz256/global_step_384/actor_hf/model-00001-of-00002.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4c652b14dcaa8e56893d9c26f7bd3af48f6dc4bc50f0b4cc24f129591310b805
|
| 3 |
+
size 4959513760
|
Llama-3.2-3B-Instruct-polaris-GRPO--bsz32/global_step_384/actor_hf/model-00001-of-00002.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:338ee1b132a164feedcd02f0b1e95f6b140a8fb0de52ffac87bac8c837cb8d28
|
| 3 |
+
size 4992510208
|
Llama-3.2-3B-Instruct-polaris-GRPO--bsz32/global_step_512/actor_hf/model-00001-of-00002.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:be7fe9681c0cd3c73814ebfb90410cde8a5e9f7c34320f8b91ca4538a8c4f08f
|
| 3 |
+
size 4751901080
|
Llama-3.2-3B-Instruct-polaris-GRPO--bsz32/global_step_64/actor_hf/model-00001-of-00002.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e80a2882b5567bf245b40a08327c680fad08bc1fad410cd24e19756b15269799
|
| 3 |
+
size 4978413896
|
Llama-3.2-3B-Instruct-polaris-GRPO--bsz512/global_step_320/actor_hf/model-00001-of-00002.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8b8603fd3b086a3ccf556f5f00841bd494602ce69057aac6423f7deb5bf8f82f
|
| 3 |
+
size 4997280952
|
Llama-3.2-3B-Instruct-polaris-GRPO--bsz512/global_step_64/actor_hf/model-00001-of-00002.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:52143ee2b0300b95bf0b81b0708be8d4dbf7464206b9689de449313edaabc8a0
|
| 3 |
+
size 4990983120
|
Llama-3.2-3B-Instruct-polaris-GRPO--bsz64/global_step_384/actor_hf/model-00001-of-00002.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1eb429af38e83f0387c7b55e9e9f068c13411f7acca2349d201bf95e04ec2acb
|
| 3 |
+
size 4997262544
|