faro1219 committed on
Commit
100e3b4
·
verified ·
1 Parent(s): e7f9bae

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. fineweb-10B/gpt2/eos/adam/linear/linear-256-2048-15000-0.1/lr_0.0018-wd_0.1-betas_0.9_0.95-bs_32-seq_1024-iters_15000/250622_035242/eos/step_001000/losses_lr.pt +3 -0
  3. fineweb-10B/gpt2/eos/adam/linear/linear-256-2048-15000-0.1/lr_0.0018-wd_0.1-betas_0.9_0.95-bs_32-seq_1024-iters_15000/250622_035242/eos/step_001000/norms_lr.pt +3 -0
  4. fineweb-10B/gpt2/eos/adam/linear/linear-256-2048-15000-0.1/lr_0.0018-wd_0.1-betas_0.9_0.95-bs_32-seq_1024-iters_15000/250622_035242/eos/step_002000/losses_lr.pt +3 -0
  5. fineweb-10B/gpt2/eos/adam/linear/linear-256-2048-15000-0.1/lr_0.0018-wd_0.1-betas_0.9_0.95-bs_32-seq_1024-iters_15000/250622_035242/eos/step_002000/norms_lr.pt +3 -0
  6. fineweb-10B/gpt2/eos/adam/linear/linear-256-2048-15000-0.1/lr_0.0018-wd_0.1-betas_0.9_0.95-bs_32-seq_1024-iters_15000/250622_035242/eos/step_007000/losses_lr.png +3 -0
  7. fineweb-10B/gpt2/eos/adam/linear/linear-256-2048-15000-0.1/lr_0.0018-wd_0.1-betas_0.9_0.95-bs_32-seq_1024-iters_15000/250622_035242/eos/step_007000/losses_lr.pt +3 -0
  8. fineweb-10B/gpt2/eos/adam/linear/linear-256-2048-15000-0.1/lr_0.0018-wd_0.1-betas_0.9_0.95-bs_32-seq_1024-iters_15000/250622_035242/eos/step_007000/norms_lr.pt +3 -0
  9. fineweb-10B/gpt2/eos/adam/linear/linear-256-2048-15000-0.1/lr_0.0018-wd_0.1-betas_0.9_0.95-bs_32-seq_1024-iters_15000/250622_035242/eos/step_010000/losses_lr.pt +3 -0
  10. fineweb-10B/gpt2/eos/adam/linear/linear-256-2048-15000-0.1/lr_0.0018-wd_0.1-betas_0.9_0.95-bs_32-seq_1024-iters_15000/250622_035242/eos/step_010000/norms_lr.pt +3 -0
  11. fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250730_000401/checkpoints/step_001000.pt +3 -0
  12. fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250730_000401/checkpoints/step_006000.pt +3 -0
  13. fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250730_000401/checkpoints/step_018000.pt +3 -0
  14. fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250730_000401/checkpoints/step_021000.pt +3 -0
  15. fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250730_000401/checkpoints/step_022000.pt +3 -0
  16. fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250730_000401/checkpoints/step_023000.pt +3 -0
  17. fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250730_000401/checkpoints/step_024000.pt +3 -0
  18. fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250730_000401/checkpoints/step_025000.pt +3 -0
  19. fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.98-bs_32-seq_1024-iters_25000/250730_022725/checkpoints/step_016000.pt +3 -0
  20. fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.98-bs_32-seq_1024-iters_25000/250730_022725/checkpoints/step_022000.pt +3 -0
  21. fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.98-bs_32-seq_1024-iters_25000/250730_022725/checkpoints/step_024000.pt +3 -0
  22. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.0-bs_32-seq_1024-iters_9536/250622_011417/checkpoints/step_001000.pt +3 -0
  23. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.0-bs_32-seq_1024-iters_9536/250622_011417/checkpoints/step_003500.pt +3 -0
  24. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.0-bs_32-seq_1024-iters_9536/250622_011417/checkpoints/step_004000.pt +3 -0
  25. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.0-bs_32-seq_1024-iters_9536/250622_011417/checkpoints/step_005500.pt +3 -0
  26. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.0-bs_32-seq_1024-iters_9536/250622_011417/checkpoints/step_007000.pt +3 -0
  27. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.0-bs_32-seq_1024-iters_9536/250622_011417/checkpoints/step_007500.pt +3 -0
  28. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.0-bs_32-seq_1024-iters_9536/250622_011417/checkpoints/step_009500.pt +3 -0
  29. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_000000.pt +3 -0
  30. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_001000.pt +3 -0
  31. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_002000.pt +3 -0
  32. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_003000.pt +3 -0
  33. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_004000.pt +3 -0
  34. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_005000.pt +3 -0
  35. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_006000.pt +3 -0
  36. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_007000.pt +3 -0
  37. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_008000.pt +3 -0
  38. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_010000.pt +3 -0
  39. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_013000.pt +3 -0
  40. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_014000.pt +3 -0
  41. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_015000.pt +3 -0
  42. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_017000.pt +3 -0
  43. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_018000.pt +3 -0
  44. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_019000.pt +3 -0
  45. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_020000.pt +3 -0
  46. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_022000.pt +3 -0
  47. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_023000.pt +3 -0
  48. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_024000.pt +3 -0
  49. fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_025000.pt +3 -0
  50. fineweb-10B/gpt2/eos/sgd/constant/lr_0.06-wd_0.0001-m_0.95-bs_32-seq_1024-iters_9536/250702_163449/checkpoints/step_003000.pt +3 -0
.gitattributes CHANGED
@@ -177,3 +177,4 @@ fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.98-bs_32-seq_1024-iters_
177
  fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.98-bs_32-seq_1024-iters_25000/250730_022725/eos/step_025000/combined_eos_analysis.png filter=lfs diff=lfs merge=lfs -text
178
  fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.0-bs_32-seq_1024-iters_9536/250622_011417/eos/step_001000/losses_lr.png filter=lfs diff=lfs merge=lfs -text
179
  fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.0-bs_32-seq_1024-iters_9536/250622_011417/eos/step_003500/losses_lr.png filter=lfs diff=lfs merge=lfs -text
 
 
177
  fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.98-bs_32-seq_1024-iters_25000/250730_022725/eos/step_025000/combined_eos_analysis.png filter=lfs diff=lfs merge=lfs -text
178
  fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.0-bs_32-seq_1024-iters_9536/250622_011417/eos/step_001000/losses_lr.png filter=lfs diff=lfs merge=lfs -text
179
  fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.0-bs_32-seq_1024-iters_9536/250622_011417/eos/step_003500/losses_lr.png filter=lfs diff=lfs merge=lfs -text
180
+ fineweb-10B/gpt2/eos/adam/linear/linear-256-2048-15000-0.1/lr_0.0018-wd_0.1-betas_0.9_0.95-bs_32-seq_1024-iters_15000/250622_035242/eos/step_007000/losses_lr.png filter=lfs diff=lfs merge=lfs -text
fineweb-10B/gpt2/eos/adam/linear/linear-256-2048-15000-0.1/lr_0.0018-wd_0.1-betas_0.9_0.95-bs_32-seq_1024-iters_15000/250622_035242/eos/step_001000/losses_lr.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9b45cf5e910ffcffb81afca58fe748860192bd1bf1ce3e1e675c162eff0e22f
3
+ size 3575
fineweb-10B/gpt2/eos/adam/linear/linear-256-2048-15000-0.1/lr_0.0018-wd_0.1-betas_0.9_0.95-bs_32-seq_1024-iters_15000/250622_035242/eos/step_001000/norms_lr.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a515940906bc1d4c768246d64e27a5a7e3757735465cdf59733be534d5b22b6
3
+ size 3568
fineweb-10B/gpt2/eos/adam/linear/linear-256-2048-15000-0.1/lr_0.0018-wd_0.1-betas_0.9_0.95-bs_32-seq_1024-iters_15000/250622_035242/eos/step_002000/losses_lr.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bd27a8ca837b608ec6f3614fc63bc61e182f25f2b94997949502043fa75b0d8
3
+ size 3575
fineweb-10B/gpt2/eos/adam/linear/linear-256-2048-15000-0.1/lr_0.0018-wd_0.1-betas_0.9_0.95-bs_32-seq_1024-iters_15000/250622_035242/eos/step_002000/norms_lr.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e485b742884ec23554366f53f9f725842997b7cf934f6b8acbb5eaa4e47e9e92
3
+ size 3568
fineweb-10B/gpt2/eos/adam/linear/linear-256-2048-15000-0.1/lr_0.0018-wd_0.1-betas_0.9_0.95-bs_32-seq_1024-iters_15000/250622_035242/eos/step_007000/losses_lr.png ADDED

Git LFS Details

  • SHA256: 9e3a0ff341eed85d340d6ed9829ee0f74ff92189d6d0fb672d2b1052772e6f04
  • Pointer size: 131 Bytes
  • Size of remote file: 121 kB
fineweb-10B/gpt2/eos/adam/linear/linear-256-2048-15000-0.1/lr_0.0018-wd_0.1-betas_0.9_0.95-bs_32-seq_1024-iters_15000/250622_035242/eos/step_007000/losses_lr.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31c1f66aaf25cccef12aed41e83e817cb4aed1cea590f9e2bab139f92f7aeee5
3
+ size 3575
fineweb-10B/gpt2/eos/adam/linear/linear-256-2048-15000-0.1/lr_0.0018-wd_0.1-betas_0.9_0.95-bs_32-seq_1024-iters_15000/250622_035242/eos/step_007000/norms_lr.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17211def3299e895c0e8d9d88c9cad47029c5844bcf2dc3e693ca93b014be3cf
3
+ size 3568
fineweb-10B/gpt2/eos/adam/linear/linear-256-2048-15000-0.1/lr_0.0018-wd_0.1-betas_0.9_0.95-bs_32-seq_1024-iters_15000/250622_035242/eos/step_010000/losses_lr.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70a38b3a6ed9897004c946ec312b69f5d6841c2b3f02a61cac8ca39c5989b284
3
+ size 3575
fineweb-10B/gpt2/eos/adam/linear/linear-256-2048-15000-0.1/lr_0.0018-wd_0.1-betas_0.9_0.95-bs_32-seq_1024-iters_15000/250622_035242/eos/step_010000/norms_lr.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31ff8e38650a039885ba6e2d8f6bd3ccd2390150a6d98db5b9b6b51ef93e3c97
3
+ size 3568
fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250730_000401/checkpoints/step_001000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:581f791ec827e2b336d9f687e19b9e1415831332682702f6fabe4a281ff42acb
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250730_000401/checkpoints/step_006000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7061df12b77b3b9b5df6e08e1ff16b1d88188d7552003d52186cbda9a50de5c4
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250730_000401/checkpoints/step_018000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d1bc4ac24eec284ef4242de349d3981cda8fe519d32550c976aa990afa21ab8
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250730_000401/checkpoints/step_021000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:130d2bcae971d70d23e22545d0a2bb2d4f2b7c42664350958e7604d43c2eaa37
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250730_000401/checkpoints/step_022000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51849bfa5b0f78afdcea5dff2036442a3c86a070a919c585f8ec81ec436b4f11
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250730_000401/checkpoints/step_023000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12f4164bad305b8a02dd7b39552feeb8317c5706788c4c4785befd71ceaaa435
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250730_000401/checkpoints/step_024000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d00bd52f8b2028b576a106ab3dde5a1ce2e23b10b77a9f95647997b48426dbbe
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250730_000401/checkpoints/step_025000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b20dff63d44fbcee77bd0c4989145e37bb2a219606f6e76bb0baba9e223ea54
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.98-bs_32-seq_1024-iters_25000/250730_022725/checkpoints/step_016000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80e462008010f39e5c114e9219240b6070f60fdb550398c90cdff95f1a69715a
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.98-bs_32-seq_1024-iters_25000/250730_022725/checkpoints/step_022000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1236ea7170f272a12a56a4f27486d086994aa9c2d15bdd83121ab162935e4ed6
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.01-wd_0.0001-m_0.98-bs_32-seq_1024-iters_25000/250730_022725/checkpoints/step_024000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36784e29ce772f4c5f93992073cb4255458be1cef9c7697304498bf9185b8924
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.0-bs_32-seq_1024-iters_9536/250622_011417/checkpoints/step_001000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:203aad999bd05a913b30accf499818e75dce07c48ac90a8f16faa63c2ceaf68b
3
+ size 648821973
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.0-bs_32-seq_1024-iters_9536/250622_011417/checkpoints/step_003500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c9b64f045978413a8fba8d402112ce97d545e96a7be7869e73822070b805aca
3
+ size 648821973
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.0-bs_32-seq_1024-iters_9536/250622_011417/checkpoints/step_004000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efa40822968d1380e7f164129b36fe4a3f0c5a15934828cca428e97db7733931
3
+ size 648821973
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.0-bs_32-seq_1024-iters_9536/250622_011417/checkpoints/step_005500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b30e82e1e8e81e6b38b0b3b19a7c48dc0183305a37190309ae7fd14939d94c68
3
+ size 648821973
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.0-bs_32-seq_1024-iters_9536/250622_011417/checkpoints/step_007000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6fd14e23dedce640e1741687e02fb0581b242ab7cb48d7a72ef5316ded67f4c
3
+ size 648821973
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.0-bs_32-seq_1024-iters_9536/250622_011417/checkpoints/step_007500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7afdb34bc5ca64dab9e8ee7b34bbc4cf3428eec96c471d0855a6ee49a2a40fbe
3
+ size 648821973
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.0-bs_32-seq_1024-iters_9536/250622_011417/checkpoints/step_009500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f2a30db2f8924ec6354fcf0dfe3262444e46ef197b78d9ac9d8ea43b43078a0
3
+ size 648821973
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_000000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aabdd09acc5b62e5e5d5db14a64bbabb6abbf4d317cbd71586f216789f529a79
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_001000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41606eac264c2bdfffb1be001b3da354b969dba111b20d3aacc0f8ccfebd1a14
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_002000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cba2bdccb4a2578232493b90568d0b388eb041d91c7759c324162e896805214
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_003000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6190cba24e14507d20f7551a13df43b7d7445863f7de1f3bc9635ed3ace2486
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_004000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af277026895b518859222979fd7f6b52aed9966b637e5a957b87af90c2f1f5dc
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_005000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c54060533c57addb7a25087dbea440717f773ca8ee998efa1820b729c5d38e6a
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_006000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58706634ea5f18cad2b11f810f378b91453027202e85d645146fd1a4ae27494d
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_007000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a7eb6e26bfe1c8bc208c941b81aa58d05dec75396b29236a6722a52f63f7023
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_008000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1097a4fa65ab13da10f3e51a0ad500e030f7dcd7bf738f9397adfe85edae5b1f
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_010000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:040efc888b7d2b3aa6368334dfceed53bc1ceb391665b0b60933aba0837a0859
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_013000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67913a3cc27a7ef67ecd6ebf6871cc1bfc4545fe89f674e50a3622ef529446be
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_014000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b10469afa9f03c302e7c3683ebf046701161e0093c4ba872887f885f1ec6ae52
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_015000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d2f49c396f10184510511c04d1612136d2346c6c64cc6c93e54d28073d609fe
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_017000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97169153364a3968ff481425961624e46bd8fbc3d240428eb67966bc66822eb7
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_018000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:214330c363ed2c20f307408b07e521f7ca8bd2bfc5fb574f99584d839e44a66a
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_019000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54aaf8990033639264a13bb495494294e366b705638b80b6b3c4fddec7b8da6b
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_020000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b438479d03d90312ee866349d7bb334ad9cc3554ccc1484a0bbfa23258b5ce7
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_022000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3375eb1ab2da45e9b8b17322fee824bba7c82ed6868df9eba2c5fccdeba107c7
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_023000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c52ebc03bd780c64a3f76f255dc4a356bf32ca21973d4c8e38d3d81c7e68185
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_024000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:426c27142843ea8280de2a09d69ea492be75382011168eae96d446577d7477dd
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.03-wd_0.0001-m_0.95-bs_32-seq_1024-iters_25000/250729_212048/checkpoints/step_025000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2f4be880e089960cf832a8f30a0cf56530f9194b634ae4f08ed1744c4d44127
3
+ size 1297616507
fineweb-10B/gpt2/eos/sgd/constant/lr_0.06-wd_0.0001-m_0.95-bs_32-seq_1024-iters_9536/250702_163449/checkpoints/step_003000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9148c49891ccdaf172d347687f00cacdabdaccd194f1d972687b0ff5b7f03821
3
+ size 1297607995