DatPySci commited on
Commit
d29b9f4
·
verified ·
1 Parent(s): 623ff10

Add files using upload-large-folder tool

Browse files
Files changed (15) hide show
  1. Llama-3.2-3B-Instruct-polaris-GRPO--bsz128/global_step_128/actor_hf/model-00001-of-00002.safetensors +3 -0
  2. Llama-3.2-3B-Instruct-polaris-GRPO--bsz128/global_step_256/actor_hf/model-00001-of-00002.safetensors +3 -0
  3. Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_192/actor_hf/model-00001-of-00002.safetensors +3 -0
  4. Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_384/actor_hf/model-00001-of-00002.safetensors +3 -0
  5. Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_512/actor_hf/model-00001-of-00002.safetensors +3 -0
  6. Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_64/actor_hf/model-00001-of-00002.safetensors +3 -0
  7. Llama-3.2-3B-Instruct-polaris-GRPO--bsz256/global_step_192/actor_hf/model-00001-of-00002.safetensors +3 -0
  8. Llama-3.2-3B-Instruct-polaris-GRPO--bsz256/global_step_256/actor_hf/model-00001-of-00002.safetensors +3 -0
  9. Llama-3.2-3B-Instruct-polaris-GRPO--bsz256/global_step_384/actor_hf/model-00001-of-00002.safetensors +3 -0
  10. Llama-3.2-3B-Instruct-polaris-GRPO--bsz32/global_step_384/actor_hf/model-00001-of-00002.safetensors +3 -0
  11. Llama-3.2-3B-Instruct-polaris-GRPO--bsz32/global_step_512/actor_hf/model-00001-of-00002.safetensors +3 -0
  12. Llama-3.2-3B-Instruct-polaris-GRPO--bsz32/global_step_64/actor_hf/model-00001-of-00002.safetensors +3 -0
  13. Llama-3.2-3B-Instruct-polaris-GRPO--bsz512/global_step_320/actor_hf/model-00001-of-00002.safetensors +3 -0
  14. Llama-3.2-3B-Instruct-polaris-GRPO--bsz512/global_step_64/actor_hf/model-00001-of-00002.safetensors +3 -0
  15. Llama-3.2-3B-Instruct-polaris-GRPO--bsz64/global_step_384/actor_hf/model-00001-of-00002.safetensors +3 -0
Llama-3.2-3B-Instruct-polaris-GRPO--bsz128/global_step_128/actor_hf/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f195fe1da778c32c2451fd488d4fa1b2df71e41b6c2cfd49fb6774c01c837ae5
3
+ size 4973610584
Llama-3.2-3B-Instruct-polaris-GRPO--bsz128/global_step_256/actor_hf/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:838aa332345304574b0ab7329f32f966a3d8eb90ae5222ad98be9e448d037323
3
+ size 4821120184
Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_192/actor_hf/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffa4da8162c7218467b08d2f825cdfe14363670c163f61ed3853f755706711ca
3
+ size 4984680248
Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_384/actor_hf/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:736f356d7cb6fcd36adba376ec8d8628aabe702018ef5f7c0451f776be51c442
3
+ size 4731468832
Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_512/actor_hf/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d79a266c6e97e6d3295eb1a8b3b32d7523be0079135448a51bfaf3a8e70d4bc
3
+ size 4959520672
Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_64/actor_hf/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8ea4a034b460f21bfa6c70e251b429e204140b77594e6c95a299a70b6456ad4
3
+ size 4953222576
Llama-3.2-3B-Instruct-polaris-GRPO--bsz256/global_step_192/actor_hf/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2ca4b12066f1390818e993275b1211a7d94f673359d255fae6fb5a21f2d3ee9
3
+ size 4978375752
Llama-3.2-3B-Instruct-polaris-GRPO--bsz256/global_step_256/actor_hf/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86c33778a9e2f27d38010b9c0807952865573d26264670f2600ebc8d82edbc7d
3
+ size 4967330816
Llama-3.2-3B-Instruct-polaris-GRPO--bsz256/global_step_384/actor_hf/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c652b14dcaa8e56893d9c26f7bd3af48f6dc4bc50f0b4cc24f129591310b805
3
+ size 4959513760
Llama-3.2-3B-Instruct-polaris-GRPO--bsz32/global_step_384/actor_hf/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:338ee1b132a164feedcd02f0b1e95f6b140a8fb0de52ffac87bac8c837cb8d28
3
+ size 4992510208
Llama-3.2-3B-Instruct-polaris-GRPO--bsz32/global_step_512/actor_hf/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be7fe9681c0cd3c73814ebfb90410cde8a5e9f7c34320f8b91ca4538a8c4f08f
3
+ size 4751901080
Llama-3.2-3B-Instruct-polaris-GRPO--bsz32/global_step_64/actor_hf/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e80a2882b5567bf245b40a08327c680fad08bc1fad410cd24e19756b15269799
3
+ size 4978413896
Llama-3.2-3B-Instruct-polaris-GRPO--bsz512/global_step_320/actor_hf/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b8603fd3b086a3ccf556f5f00841bd494602ce69057aac6423f7deb5bf8f82f
3
+ size 4997280952
Llama-3.2-3B-Instruct-polaris-GRPO--bsz512/global_step_64/actor_hf/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52143ee2b0300b95bf0b81b0708be8d4dbf7464206b9689de449313edaabc8a0
3
+ size 4990983120
Llama-3.2-3B-Instruct-polaris-GRPO--bsz64/global_step_384/actor_hf/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1eb429af38e83f0387c7b55e9e9f068c13411f7acca2349d201bf95e04ec2acb
3
+ size 4997262544