mjf-su committed on
Commit
365c256
·
verified ·
1 Parent(s): 6e8e937

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +11 -0
  2. grpo-nADE-format-RC/checkpoint-100/rng_state_0.pth +3 -0
  3. grpo-nADE-format-RC/checkpoint-100/rng_state_1.pth +3 -0
  4. grpo-nADE-format-RC/checkpoint-100/rng_state_2.pth +3 -0
  5. grpo-nADE-format-RC/checkpoint-100/rng_state_3.pth +3 -0
  6. grpo-nADE-format-RC/checkpoint-100/scheduler.pt +3 -0
  7. grpo-nADE-format-RC/checkpoint-100/tokenizer.json +3 -0
  8. grpo-nADE-format-RC/checkpoint-100/training_args.bin +3 -0
  9. grpo-nADE-format-RC/checkpoint-200/rng_state_0.pth +3 -0
  10. grpo-nADE-format-RC/checkpoint-200/rng_state_1.pth +3 -0
  11. grpo-nADE-format-RC/checkpoint-200/rng_state_2.pth +3 -0
  12. grpo-nADE-format-RC/checkpoint-200/rng_state_3.pth +3 -0
  13. grpo-nADE-format-RC/checkpoint-200/scheduler.pt +3 -0
  14. grpo-nADE-format-RC/checkpoint-200/tokenizer.json +3 -0
  15. grpo-nADE-format-RC/checkpoint-200/training_args.bin +3 -0
  16. grpo-nADE-format-RC/checkpoint-300/rng_state_0.pth +3 -0
  17. grpo-nADE-format-RC/checkpoint-300/rng_state_1.pth +3 -0
  18. grpo-nADE-format-RC/checkpoint-300/rng_state_2.pth +3 -0
  19. grpo-nADE-format-RC/checkpoint-300/rng_state_3.pth +3 -0
  20. grpo-nADE-format-RC/checkpoint-300/scheduler.pt +3 -0
  21. grpo-nADE-format-RC/checkpoint-300/tokenizer.json +3 -0
  22. grpo-nADE-format-RC/checkpoint-300/training_args.bin +3 -0
  23. grpo-nADE-format-RC/checkpoint-400/rng_state_0.pth +3 -0
  24. grpo-nADE-format-RC/checkpoint-400/rng_state_1.pth +3 -0
  25. grpo-nADE-format-RC/checkpoint-400/rng_state_2.pth +3 -0
  26. grpo-nADE-format-RC/checkpoint-400/rng_state_3.pth +3 -0
  27. grpo-nADE-format-RC/checkpoint-400/scheduler.pt +3 -0
  28. grpo-nADE-format-RC/checkpoint-400/tokenizer.json +3 -0
  29. grpo-nADE-format-RC/checkpoint-400/training_args.bin +3 -0
  30. grpo-nADE-format-RC/checkpoint-417/rng_state_0.pth +3 -0
  31. grpo-nADE-format-RC/checkpoint-417/rng_state_1.pth +3 -0
  32. grpo-nADE-format-RC/checkpoint-417/rng_state_2.pth +3 -0
  33. grpo-nADE-format-RC/checkpoint-417/rng_state_3.pth +3 -0
  34. grpo-nADE-format-RC/checkpoint-417/scheduler.pt +3 -0
  35. grpo-nADE-format-RC/checkpoint-417/tokenizer.json +3 -0
  36. grpo-nADE-format-RC/checkpoint-417/training_args.bin +3 -0
  37. grpo-nADE-format-RC/tokenizer.json +3 -0
  38. grpo-nADE-format-RC/training_args.bin +3 -0
  39. grpo-nADE-format/checkpoint-100/rng_state_0.pth +3 -0
  40. grpo-nADE-format/checkpoint-100/rng_state_1.pth +3 -0
  41. grpo-nADE-format/checkpoint-100/rng_state_2.pth +3 -0
  42. grpo-nADE-format/checkpoint-100/rng_state_3.pth +3 -0
  43. grpo-nADE-format/checkpoint-100/scheduler.pt +3 -0
  44. grpo-nADE-format/checkpoint-100/tokenizer.json +3 -0
  45. grpo-nADE-format/checkpoint-100/training_args.bin +3 -0
  46. grpo-nADE-format/checkpoint-200/model-00002-of-00002.safetensors +3 -0
  47. grpo-nADE-format/checkpoint-200/rng_state_0.pth +3 -0
  48. grpo-nADE-format/checkpoint-200/rng_state_1.pth +3 -0
  49. grpo-nADE-format/checkpoint-200/rng_state_2.pth +3 -0
  50. grpo-nADE-format/checkpoint-200/rng_state_3.pth +3 -0
.gitattributes CHANGED
@@ -1048,3 +1048,14 @@ ADEn-TF-KL0/checkpoint-200/tokenizer.json filter=lfs diff=lfs merge=lfs -text
1048
  ADEn-TF-KL0/checkpoint-292/tokenizer.json filter=lfs diff=lfs merge=lfs -text
1049
  ADEn-TF-KL0/tokenizer.json filter=lfs diff=lfs merge=lfs -text
1050
  grpo-nADE-format/checkpoint-417/tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
1048
  ADEn-TF-KL0/checkpoint-292/tokenizer.json filter=lfs diff=lfs merge=lfs -text
1049
  ADEn-TF-KL0/tokenizer.json filter=lfs diff=lfs merge=lfs -text
1050
  grpo-nADE-format/checkpoint-417/tokenizer.json filter=lfs diff=lfs merge=lfs -text
1051
+ grpo-nADE-format-RC/checkpoint-200/tokenizer.json filter=lfs diff=lfs merge=lfs -text
1052
+ grpo-nADE-format-RC/checkpoint-100/tokenizer.json filter=lfs diff=lfs merge=lfs -text
1053
+ grpo-nADE-format-RC/checkpoint-300/tokenizer.json filter=lfs diff=lfs merge=lfs -text
1054
+ grpo-nADE-format-RC/tokenizer.json filter=lfs diff=lfs merge=lfs -text
1055
+ grpo-nADE-format/checkpoint-400/tokenizer.json filter=lfs diff=lfs merge=lfs -text
1056
+ grpo-nADE-format/tokenizer.json filter=lfs diff=lfs merge=lfs -text
1057
+ grpo-nADE-format/checkpoint-100/tokenizer.json filter=lfs diff=lfs merge=lfs -text
1058
+ grpo-nADE-format/checkpoint-200/tokenizer.json filter=lfs diff=lfs merge=lfs -text
1059
+ grpo-nADE-format/checkpoint-300/tokenizer.json filter=lfs diff=lfs merge=lfs -text
1060
+ grpo-nADE-format-RC/checkpoint-400/tokenizer.json filter=lfs diff=lfs merge=lfs -text
1061
+ grpo-nADE-format-RC/checkpoint-417/tokenizer.json filter=lfs diff=lfs merge=lfs -text
grpo-nADE-format-RC/checkpoint-100/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ba7e74f7c7ea2d96d8166b8dcb3f01082c866ab87bacee2cf4c7df2741dbf0d
3
+ size 15429
grpo-nADE-format-RC/checkpoint-100/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5208e23389eda366a5f8c04d057490d2ed6290f564b28a914fe0510e4aa03717
3
+ size 15365
grpo-nADE-format-RC/checkpoint-100/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5b694b76d744c7b31eabd27d529ac45e7471189a2b5b674547ab6cdd018031c
3
+ size 15429
grpo-nADE-format-RC/checkpoint-100/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:921b8c5678df42726112db68ba2a311fa8f20f3bcc30c9afd9b11354a54b0a4a
3
+ size 15429
grpo-nADE-format-RC/checkpoint-100/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61d460559cb720beadd3382b1090202d552a46ed3a6a88226cbe15843187a440
3
+ size 1465
grpo-nADE-format-RC/checkpoint-100/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21f6994642cfbd8473e43b4fae1d60d4a953aea1419dc28b4ae3f41778cd0924
3
+ size 11422922
grpo-nADE-format-RC/checkpoint-100/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f11edcc29132c3b5adfe5314e8669850619863c55e927d0aba3784738f3cd901
3
+ size 7633
grpo-nADE-format-RC/checkpoint-200/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a40a1001a2b07975ae574dff539a4aa15aca4e7d1ccfdbcff73d79459ebb4ff
3
+ size 15365
grpo-nADE-format-RC/checkpoint-200/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b39beed5bb9f4e5e17c5af617b1e31870ad4c4b7b8814144f75ec15f4a9263f
3
+ size 15365
grpo-nADE-format-RC/checkpoint-200/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34a8f2138cf9d5d545b174eb56c59fc17ff6f9728410da2f43efdf26d8507296
3
+ size 15429
grpo-nADE-format-RC/checkpoint-200/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89f7bd42a8fc2c82cdca37b866bd8551372c48cc3239121fa2720978657e1d64
3
+ size 15429
grpo-nADE-format-RC/checkpoint-200/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b26f664df9ea123afdec6d5bc6dfe2a52a3a7ef722b018926d5652844db76dfd
3
+ size 1465
grpo-nADE-format-RC/checkpoint-200/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21f6994642cfbd8473e43b4fae1d60d4a953aea1419dc28b4ae3f41778cd0924
3
+ size 11422922
grpo-nADE-format-RC/checkpoint-200/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f11edcc29132c3b5adfe5314e8669850619863c55e927d0aba3784738f3cd901
3
+ size 7633
grpo-nADE-format-RC/checkpoint-300/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4301b8c86f477610df5ea36ff648ef1c3d3eb9d448dc4625d072e382c8c5afec
3
+ size 15365
grpo-nADE-format-RC/checkpoint-300/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2616b60494cf20ed7b4c5bf92ec4b248230e5eb404fd5f774ad84c81a6f1d504
3
+ size 15365
grpo-nADE-format-RC/checkpoint-300/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dab2d72368db873383eecfc2fce6cdbf6fae74900077d889bd7d8b83c5fe842
3
+ size 15429
grpo-nADE-format-RC/checkpoint-300/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d526a10e23dd4ef93608fdbc49ff2493543a6f4ccf3aee0920dd58ba088e965
3
+ size 15429
grpo-nADE-format-RC/checkpoint-300/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb1c6111e7614e1dde75357bc4aeac385c5477b97b707cd4b24ed87f968c9360
3
+ size 1465
grpo-nADE-format-RC/checkpoint-300/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21f6994642cfbd8473e43b4fae1d60d4a953aea1419dc28b4ae3f41778cd0924
3
+ size 11422922
grpo-nADE-format-RC/checkpoint-300/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f11edcc29132c3b5adfe5314e8669850619863c55e927d0aba3784738f3cd901
3
+ size 7633
grpo-nADE-format-RC/checkpoint-400/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1390cc21ca5e0f6f1b86db1c41839377eb0410829a85bef7a33cfa4cb50d1d2
3
+ size 15365
grpo-nADE-format-RC/checkpoint-400/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:adfe4b4d9bc81c6da85e901da248ed8f8e995fc460c467cdb6f84c5bf9da5f1f
3
+ size 15365
grpo-nADE-format-RC/checkpoint-400/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c7d79d70782b122cf9c0f3e6e4672e0bc237c14179c9b7791866120fb2d777c
3
+ size 15429
grpo-nADE-format-RC/checkpoint-400/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c34cee1280e2fdeb8333229bff0479e667c386d92ae770f110dfe8f80da416c
3
+ size 15429
grpo-nADE-format-RC/checkpoint-400/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa38db0ee66b5140257894222f100500c67bda119c7b2e36356f905ad7e51ad6
3
+ size 1465
grpo-nADE-format-RC/checkpoint-400/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21f6994642cfbd8473e43b4fae1d60d4a953aea1419dc28b4ae3f41778cd0924
3
+ size 11422922
grpo-nADE-format-RC/checkpoint-400/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f11edcc29132c3b5adfe5314e8669850619863c55e927d0aba3784738f3cd901
3
+ size 7633
grpo-nADE-format-RC/checkpoint-417/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:964080724c5d51507e080add3b0f664d1e2676a23b328bfa79c580676f81739f
3
+ size 15429
grpo-nADE-format-RC/checkpoint-417/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc2571df8e6ae99ded4f8d0f50b8d033aca9e63016921c1813607291c28c5e36
3
+ size 15365
grpo-nADE-format-RC/checkpoint-417/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:199b58b39f136b29325192c90104bf964682d9ee0905c5d7425ed03a882a548b
3
+ size 15429
grpo-nADE-format-RC/checkpoint-417/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cb1023c705d0373d9f03bf93b229936c158b054bf08ff3ce38ac3aee7b33288
3
+ size 15429
grpo-nADE-format-RC/checkpoint-417/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fe8646ef7324fdd4b67dccf5069be2bc4cc3430c2a71edea42ce4fd1889cde1
3
+ size 1465
grpo-nADE-format-RC/checkpoint-417/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21f6994642cfbd8473e43b4fae1d60d4a953aea1419dc28b4ae3f41778cd0924
3
+ size 11422922
grpo-nADE-format-RC/checkpoint-417/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f11edcc29132c3b5adfe5314e8669850619863c55e927d0aba3784738f3cd901
3
+ size 7633
grpo-nADE-format-RC/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21f6994642cfbd8473e43b4fae1d60d4a953aea1419dc28b4ae3f41778cd0924
3
+ size 11422922
grpo-nADE-format-RC/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f11edcc29132c3b5adfe5314e8669850619863c55e927d0aba3784738f3cd901
3
+ size 7633
grpo-nADE-format/checkpoint-100/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f86a7c074129e7de804e1410b58a8b5cb02b5fe9142af2e75063ca806c151aa
3
+ size 15429
grpo-nADE-format/checkpoint-100/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:876f17dbc17618e4983d8e1d8e956268bd26af0ab976de82dd1a7f02d25e676d
3
+ size 15365
grpo-nADE-format/checkpoint-100/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48f891dc7eceb52046f622053cb34452b335fb8f491da153774a00011fb19bd4
3
+ size 15429
grpo-nADE-format/checkpoint-100/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f74a26cc1a4a8c2e05c01d00feb8a80b120c300189816294827544002b41f414
3
+ size 15429
grpo-nADE-format/checkpoint-100/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61d460559cb720beadd3382b1090202d552a46ed3a6a88226cbe15843187a440
3
+ size 1465
grpo-nADE-format/checkpoint-100/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67cc0080ffd7555f723f423c27cfef314e1ad9d335c8b79f465c5faba1ed478b
3
+ size 11422821
grpo-nADE-format/checkpoint-100/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1565c485eb001af2dc7b256cffc10af77b60177eda8933b601053faf22369ac0
3
+ size 7569
grpo-nADE-format/checkpoint-200/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97382960c28e69a6c83495571b8ead83e84ec66d3f3309c648e3aa9f030e00f1
3
+ size 3885221448
grpo-nADE-format/checkpoint-200/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff5d8d1ce49fb1658b3af5d59d0d1a90581eb01eaa72ba39f7f13e5247f9a1f0
3
+ size 15365
grpo-nADE-format/checkpoint-200/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41cf4003996112b64d524a6ff3c38ede8f3c82fe49f8699d3f5d8e1ef4e2a171
3
+ size 15365
grpo-nADE-format/checkpoint-200/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bab38b089142ae0571ccd6af3ee6330ef01042d4c28f3252ef8841266de75c98
3
+ size 15429
grpo-nADE-format/checkpoint-200/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f4ad370d126af02fd7b7dfbdca07995e92f44c5a1ea5274403161682aa3edb4
3
+ size 15429