Upload folder using huggingface_hub

#304
Files changed (20) hide show
  1. Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-100000.pth +3 -0
  2. Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-120000.pth +3 -0
  3. Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-140000.pth +3 -0
  4. Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-160000.pth +3 -0
  5. Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-180000.pth +3 -0
  6. Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-20000.pth +3 -0
  7. Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-200000.pth +3 -0
  8. Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-220000.pth +3 -0
  9. Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-240000.pth +3 -0
  10. Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-260000.pth +3 -0
  11. Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-280000.pth +3 -0
  12. Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-300000.pth +3 -0
  13. Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-320000.pth +3 -0
  14. Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-340000.pth +3 -0
  15. Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-360000.pth +3 -0
  16. Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-380000.pth +3 -0
  17. Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-40000.pth +3 -0
  18. Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-400000.pth +3 -0
  19. Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-60000.pth +3 -0
  20. Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-80000.pth +3 -0
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-100000.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28c06064cf863a3474628ceafd6736586ae8ade7e62fa71cc8f46c52884fed67
3
+ size 8140483812
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-120000.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2173a9e98ea7e56b2687fa08885d3bf7e935879c1012fcde2ded7ff570dafac7
3
+ size 8140483812
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-140000.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c09fdbfbc6804e455d6affe7ea8375a548190af9d1bc080ee6a313237fc66e16
3
+ size 8140483940
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-160000.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de953f2bdac72995063e532ba5a3315619b3e3584da66122dea2734ed39d3889
3
+ size 8140483940
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-180000.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd05416f418c9282b3f6ce8c832eaf93db1b6aca9fe299e0df06e2547575f5ee
3
+ size 8140483940
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-20000.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5553ddfb11ce4c2980abf755ab4363e5314702c976eb561fd4aada81721813be
3
+ size 8140483748
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-200000.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4f47efea2ce20df2ae03c14fa5541a6e5d03b16cb87b318b336615f22cf22be
3
+ size 8140483940
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-220000.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b38034a660e811364d6a4695fed3bb63e40bb14a8038c14221c38e75ed3a2d88
3
+ size 8140483940
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-240000.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69585b21b4c25a29af6b93c544af1b9e63b13c6bd9725d62cd61fc44d2a6152a
3
+ size 8140483940
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-260000.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4bc0d2690867c2e8dadbf20408dc78eac828a747ade7ef4e25f3470536b9875e
3
+ size 8140483940
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-280000.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efc2ffb2cfce6bdbef8ac3841d4bfd05c32ac4c0c36f3ad47265db3be36057bf
3
+ size 8140483940
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-300000.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8d8f626650fd08fbb66d2d9368a702f12c752b187c896d3952d8ec45ac516a7
3
+ size 8140483940
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-320000.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2faa68895bd1ddeaaaf4b3402031f1fd7eccc7413a358f59d893c1c65d04a5f1
3
+ size 8140483940
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-340000.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ffbe45ffece48650e2e2de447cf0acd16a059a9b5e8318c26b4aaea1ce1c170
3
+ size 8140483940
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-360000.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81774ae23928dd37dd906f38b20c6397724fcc6c0ceb225ffde88b61c026d5c4
3
+ size 8140483940
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-380000.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3292d1f3630173f5d497d703cadd603fb1b9fc67fae6f5da75fc0c79b4c7ba78
3
+ size 8140483940
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-40000.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20e04b34216464f70897e8694dbd36bed7273f8f6d0e7ceb7326956642da556a
3
+ size 8140483748
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-400000.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abd48eac337eab21503aa134532fe55328b2cdd15bcb4184549d5103c5a5a91e
3
+ size 8140483940
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-60000.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45e4801446b579fa13e73aaaa0225624e91fc3ecb7c2eb9e2c6a2ebd8b8d770b
3
+ size 8140483748
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly/checkpoint/model-80000.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:882b88b73d10f2ea24d1521a7908c5e1ef51e3182dec442cb56cae135244eb96
3
+ size 8140483812