Escapist-X committed on
Commit
df4ea19
·
verified ·
1 Parent(s): 0e6652a

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +3 -0
  2. output_grpo_dr/checkpoint-1000/model-00001-of-00002.safetensors +3 -0
  3. output_grpo_dr/checkpoint-1000/model-00002-of-00002.safetensors +3 -0
  4. output_grpo_dr/checkpoint-1000/rng_state_0.pth +3 -0
  5. output_grpo_dr/checkpoint-1100/model-00001-of-00002.safetensors +3 -0
  6. output_grpo_dr/checkpoint-1100/tokenizer.json +3 -0
  7. output_grpo_dr/checkpoint-1300/model-00002-of-00002.safetensors +3 -0
  8. output_grpo_dr/checkpoint-1400/model-00001-of-00002.safetensors +3 -0
  9. output_grpo_dr/checkpoint-1400/model-00002-of-00002.safetensors +3 -0
  10. output_grpo_dr/checkpoint-800/model-00001-of-00002.safetensors +3 -0
  11. output_grpo_dr/checkpoint-800/model-00002-of-00002.safetensors +3 -0
  12. output_grpo_dr/checkpoint-800/rng_state_3.pth +3 -0
  13. output_grpo_dr/checkpoint-900/model-00001-of-00002.safetensors +3 -0
  14. output_grpo_dr/checkpoint-900/tokenizer.json +3 -0
  15. output_grpo_dr_3d/checkpoint-1000/model-00002-of-00002.safetensors +3 -0
  16. output_grpo_dr_3d/checkpoint-1100/model-00002-of-00002.safetensors +3 -0
  17. output_grpo_dr_3d/checkpoint-1100/training_args.bin +3 -0
  18. output_grpo_dr_3d/checkpoint-1200/model-00002-of-00002.safetensors +3 -0
  19. output_grpo_dr_3d/checkpoint-1300/model-00002-of-00002.safetensors +3 -0
  20. output_grpo_dr_3d/checkpoint-900/model-00002-of-00002.safetensors +3 -0
  21. output_grpo_dr_geo/checkpoint-1000/model-00002-of-00002.safetensors +3 -0
  22. output_grpo_dr_geo/checkpoint-1050/model-00002-of-00002.safetensors +3 -0
  23. output_grpo_dr_geo/checkpoint-1050/rng_state_0.pth +3 -0
  24. output_grpo_dr_geo/checkpoint-1050/rng_state_1.pth +3 -0
  25. output_grpo_dr_geo/checkpoint-1050/rng_state_2.pth +3 -0
  26. output_grpo_dr_geo/checkpoint-1050/rng_state_3.pth +3 -0
  27. output_grpo_dr_geo/checkpoint-1050/scheduler.pt +3 -0
  28. output_grpo_dr_geo/checkpoint-1050/training_args.bin +3 -0
  29. output_grpo_dr_geo/checkpoint-1100/model-00002-of-00002.safetensors +3 -0
  30. output_grpo_dr_geo/checkpoint-1150/model-00002-of-00002.safetensors +3 -0
  31. output_grpo_dr_geo/checkpoint-1200/model-00002-of-00002.safetensors +3 -0
  32. output_grpo_dr_geo/checkpoint-1200/rng_state_2.pth +3 -0
  33. output_grpo_dr_geo/checkpoint-1200/rng_state_3.pth +3 -0
  34. output_grpo_dr_geo/checkpoint-1200/training_args.bin +3 -0
  35. output_grpo_dr_geo/checkpoint-800/model-00002-of-00002.safetensors +3 -0
  36. output_grpo_dr_geo/checkpoint-850/model-00002-of-00002.safetensors +3 -0
  37. output_grpo_dr_geo/checkpoint-900/model-00001-of-00002.safetensors +3 -0
  38. output_grpo_dr_geo/checkpoint-900/model-00002-of-00002.safetensors +3 -0
  39. output_grpo_v3/checkpoint-1000/model-00002-of-00002.safetensors +3 -0
  40. output_grpo_v3/checkpoint-1100/model-00002-of-00002.safetensors +3 -0
  41. output_grpo_v3/checkpoint-1200/model-00002-of-00002.safetensors +3 -0
  42. output_grpo_v3/checkpoint-600/model-00002-of-00002.safetensors +3 -0
  43. output_grpo_v3/checkpoint-700/model-00002-of-00002.safetensors +3 -0
  44. output_grpo_v3/checkpoint-800/model-00002-of-00002.safetensors +3 -0
  45. output_grpo_v3/checkpoint-900/model-00002-of-00002.safetensors +3 -0
  46. output_grpo_vcs/checkpoint-1000/model-00002-of-00002.safetensors +3 -0
  47. output_grpo_vcs/checkpoint-1000/rng_state_0.pth +3 -0
  48. output_grpo_vcs/checkpoint-1000/rng_state_1.pth +3 -0
  49. output_grpo_vcs/checkpoint-1000/rng_state_2.pth +3 -0
  50. output_grpo_vcs/checkpoint-1000/rng_state_3.pth +3 -0
.gitattributes CHANGED
@@ -66,3 +66,6 @@ output_grpo_dr_geo/checkpoint-900/tokenizer.json filter=lfs diff=lfs merge=lfs -
66
  output_grpo_dr_geo/checkpoint-1100/tokenizer.json filter=lfs diff=lfs merge=lfs -text
67
  output_grpo_dr/checkpoint-1300/tokenizer.json filter=lfs diff=lfs merge=lfs -text
68
  output_grpo_dr_geo/checkpoint-950/tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
 
 
 
66
  output_grpo_dr_geo/checkpoint-1100/tokenizer.json filter=lfs diff=lfs merge=lfs -text
67
  output_grpo_dr/checkpoint-1300/tokenizer.json filter=lfs diff=lfs merge=lfs -text
68
  output_grpo_dr_geo/checkpoint-950/tokenizer.json filter=lfs diff=lfs merge=lfs -text
69
+ output_grpo_vcs/checkpoint-800/tokenizer.json filter=lfs diff=lfs merge=lfs -text
70
+ output_grpo_dr/checkpoint-900/tokenizer.json filter=lfs diff=lfs merge=lfs -text
71
+ output_grpo_dr/checkpoint-1100/tokenizer.json filter=lfs diff=lfs merge=lfs -text
output_grpo_dr/checkpoint-1000/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e194b502b35d8cf154572b65fd3c02644ea203f473bb07fa190727df0f4993c
3
+ size 4997750760
output_grpo_dr/checkpoint-1000/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bd2606f79dfd46fd5aef49abcd0dabb5b56dad78d4dfc26bf4d6a1579dbd11a
3
+ size 4204299316
output_grpo_dr/checkpoint-1000/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f9b46cee676bdd2bf7522f0082670475aca22bccf15f6cef761b1a4b902cc54
3
+ size 15429
output_grpo_dr/checkpoint-1100/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:680cbc117738b7559a3df4afc3db6ab34b297c0657aaf0cb6bbe556b7869210c
3
+ size 4997750760
output_grpo_dr/checkpoint-1100/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5eee858c5123a4279c3e1f7b81247343f356ac767940b2692a928ad929543214
3
+ size 11422063
output_grpo_dr/checkpoint-1300/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:395d886210c9f759d7dfbd559d62b783e1497bfced612a2aa428693ece65d127
3
+ size 4204299316
output_grpo_dr/checkpoint-1400/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22900eb85b9ca4757de0b48ebca0f674cffcbd767a989e8e50cf5ab7c41a467e
3
+ size 4997750760
output_grpo_dr/checkpoint-1400/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3d886e1902b69d655a7eb636de9ae5746954a66707087036a83aa5ac8eaf629
3
+ size 4204299316
output_grpo_dr/checkpoint-800/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83c42575cdc827b10e1c31541ab5dffdb003d98bcd6daafb550d5dbdfe7310f1
3
+ size 4997750760
output_grpo_dr/checkpoint-800/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ad2221c6cb65b24aa642ff7241f9fb126919dcfed1e05b387f49477403483de
3
+ size 4204299316
output_grpo_dr/checkpoint-800/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b71359733974895f411b76eaaec3dabaf0dbbd6d3fd108072540478fe7fb2cb0
3
+ size 15429
output_grpo_dr/checkpoint-900/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a25508ebbabb8ba17f52ba6526b137be22b258e8e757ae17ad0bd8766266908
3
+ size 4997750760
output_grpo_dr/checkpoint-900/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5eee858c5123a4279c3e1f7b81247343f356ac767940b2692a928ad929543214
3
+ size 11422063
output_grpo_dr_3d/checkpoint-1000/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:812b28d1f5ff46c84c9e976d30ec925fe01936115cea4a1b369715dc573351b4
3
+ size 4204299316
output_grpo_dr_3d/checkpoint-1100/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f137a8dfd2f50c4a32764fd64b73f8f977f238351cf2b0b2fbc187d4126a08a
3
+ size 4204299316
output_grpo_dr_3d/checkpoint-1100/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afa311557cf9efa2f86bc63bb87a85e7f7bcfcd9f525399a1083327afb0d1234
3
+ size 7185
output_grpo_dr_3d/checkpoint-1200/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0db34d623762be96ee8a82648b2b67ea8d994102a68d1ed0eb0b4dd1a290c72f
3
+ size 4204299316
output_grpo_dr_3d/checkpoint-1300/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8d3f3a5710118f504e6e5c79157d5f48ac685f79d552c48a7472819daaa57a9
3
+ size 4204299316
output_grpo_dr_3d/checkpoint-900/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21477957c2422b5d265e2feee010b20fbc70b2a0cc30ca7c4033540659a9dc21
3
+ size 4204299316
output_grpo_dr_geo/checkpoint-1000/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d036e0cc91b64b2023d4dad4664b511c95b63c2e26121f87d8155825948c7d3
3
+ size 4204299316
output_grpo_dr_geo/checkpoint-1050/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa4a0f99ddc9a15e67aefc0cda51633781e062e91f6c44b61f0a80cfdc6dde0a
3
+ size 4204299316
output_grpo_dr_geo/checkpoint-1050/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31b33507d8634b3f7dd88f30a5d4d39d09bdc5dbe6a33a0162004750328dc4dd
3
+ size 15429
output_grpo_dr_geo/checkpoint-1050/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9577ef2adffc61e7bbde2be5f38d3a40a7ad9e1dfd4f5170a61b03c0c6f775c8
3
+ size 15365
output_grpo_dr_geo/checkpoint-1050/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb7060a4eaa3a6c201a967338f576de35103d38ff7078322757e78fa8dbc71ec
3
+ size 15429
output_grpo_dr_geo/checkpoint-1050/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc2dd0592fada6c4df6c221ec8101e1c38b96b85e4f91a1fc9eb2df6d379f61a
3
+ size 15429
output_grpo_dr_geo/checkpoint-1050/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dce64762b314982b19e68f949b6f2a9c28cf6dd5c771b583b7098dbe7f964cdc
3
+ size 1465
output_grpo_dr_geo/checkpoint-1050/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47fe018114038aef2d75bbd35b63d2812436ef8380fbe46f60e29543723244e5
3
+ size 7185
output_grpo_dr_geo/checkpoint-1100/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc6d71293b9d90598277a4a15271e91e1d7d25626821e6793c19dfe00f688e74
3
+ size 4204299316
output_grpo_dr_geo/checkpoint-1150/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a4746fa9302233585f13b9990ff7fb61545d72b7b38369d44462cbd9f0e0d68
3
+ size 4204299316
output_grpo_dr_geo/checkpoint-1200/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdfb202fdac7faaf2043ccec84d2746ad759b10bbc78f3bf0425bef90d67fdf6
3
+ size 4204299316
output_grpo_dr_geo/checkpoint-1200/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6d2b4dfff288e8a303da4165a47d8cc83ece40dbcdcef9ff6252e508b663f7a
3
+ size 15429
output_grpo_dr_geo/checkpoint-1200/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08845f606ae0bdcc61c8535761d7ef0f71600926136c75502716429ee926c6bb
3
+ size 15429
output_grpo_dr_geo/checkpoint-1200/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47fe018114038aef2d75bbd35b63d2812436ef8380fbe46f60e29543723244e5
3
+ size 7185
output_grpo_dr_geo/checkpoint-800/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc6a6121d7f94fd179f539752b5134d3fb44f541cc2950c0f8c332bd47141631
3
+ size 4204299316
output_grpo_dr_geo/checkpoint-850/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae8c60a3f8d4a5f4e3259d5341931432141e325ece5a23416560d4cb1937372e
3
+ size 4204299316
output_grpo_dr_geo/checkpoint-900/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbd9d26bde97931d33635203af820ebdf14564deae71810c80045f626463ba57
3
+ size 4997750760
output_grpo_dr_geo/checkpoint-900/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:312cf7ac29731fe7cbf36cc1ee0c76c9273291efc3838869d28ff743a357be49
3
+ size 4204299316
output_grpo_v3/checkpoint-1000/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2eb0db124deee70474117a2f527a4833c67e526569a0f11da09ec966aec22b9
3
+ size 4204299316
output_grpo_v3/checkpoint-1100/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da80d04212f507a88738d8b9b25a044646e0544101f30133c368c580b7c8722b
3
+ size 4204299316
output_grpo_v3/checkpoint-1200/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10eac37087c1719383bf8b2f57ca8b8476964f381f65340750cf6ab3658ab958
3
+ size 4204299316
output_grpo_v3/checkpoint-600/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ae078dfb65f3aeb16985c61a7bbb6df0bc9a76a16c19e9f0e635a978ebc3931
3
+ size 4204299316
output_grpo_v3/checkpoint-700/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5584681f78f300e67ded9397f69982da0d6e2e43c8c042848232c0215d179767
3
+ size 4204299316
output_grpo_v3/checkpoint-800/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ddcca8cb180b508536f7be7435b94b832eb04b5d0c75fde82fddb1320f68a0f8
3
+ size 4204299316
output_grpo_v3/checkpoint-900/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e161cc76b723d1174d702cbc696c8e62925bde2a0678300e5a11c26b77a1702
3
+ size 4204299316
output_grpo_vcs/checkpoint-1000/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c305b272613431249456c001a923ac1c8c2c6a5fb2bc0faaca8e2bddc2acbf35
3
+ size 4204299316
output_grpo_vcs/checkpoint-1000/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1facbdecf0f3bd3f1acdda7dc42ad63975720c125c1b60cd38c940926a7fe50
3
+ size 15429
output_grpo_vcs/checkpoint-1000/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4c449e9aabba782fbfedfdef9a6e898ec404173ae53a600626e2f38ff22de96
3
+ size 15365
output_grpo_vcs/checkpoint-1000/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60aa7dfeed0ea8fbad3bf9afcf8e9f0380633a9b0a92a7145642379499eecd27
3
+ size 15429
output_grpo_vcs/checkpoint-1000/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6e8f9e9f0c6afbf5a50507f45caa36792331c4821a4481a7b0f558f4a6761d6
3
+ size 15429