Upload folder using huggingface_hub
#263
by
DavidNguyen
- opened
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-100000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-120000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-140000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-160000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-180000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-20000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-200000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-220000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-240000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-260000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-280000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-300000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-320000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-340000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-360000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-380000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-40000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-400000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-60000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-80000.pth +3 -0
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-100000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:72535e11139334f5dca22cdee38d66d089478a7abc29540d76698ac34ea6fb97
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-120000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:01af2b494ef6fdec15c51b981ca6105dad1cccd25dca331a468913d3194c7307
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-140000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5da30d41b91272bcdb480a267b106607c989895cbd6ae553b90963f01f96823f
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-160000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3e86af9ae09c23e04d660c6b37d25c242bfdd62c0d07247d7e9818880518430b
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-180000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8ca9373e30c3977bdf8081347546bc3052cdde0a3227a6979aaa360bf4b4abcd
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-20000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1f500200b375ef00fc590017257300bee6ff2bc16738831f6cbb076d321b7a90
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-200000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:55b3a5c09413fde8097b9071512e8b46de6855b880f868c6543ad611a46d2005
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-220000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:476656eb789b01259c8ccfef3d5a2c888cca3ad9057a49ae051af4e647972ee0
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-240000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:87434d0ee8e962f39ab5f06fd91cac0936894ee710a936ec987480a56aaeb316
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-260000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4d1969cfffef852ec550744bfb28aed16e7e84612ee72a7d10a1d27bd3d1c920
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-280000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aa8ed54bfa7d6c7a07f24729b1af8db3cc6d06362b625452fae5dea2a06b58e0
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-300000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6b325ebdcbb16c34f705aec4d99746c5dbae63fd1aa29c5ff2d5326ad7657561
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-320000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:278d8404406019402fbee054e654c2b5ec75174b235ac8feed0ece72ae2d5720
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-340000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:76f92cfece3bc4e99db43c13fec20f0ab171a1585b19db5d5709897f012d7375
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-360000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:20681d8661591f76e32d575e063f7cf9024bf2854d6f67963d78dfe0ebe15441
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-380000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4e619cadd7283af5156e2c623669438bde1e97e98a4cb785886b1df858d4f41d
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-40000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2fac404862be6f8475bc8e49fcd8b28e911dceec178bb8fe861bbe0527631954
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-400000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4d63f023f05a5f4c8300e71f3276f31836b2ceb30ee325245cefcb60ddff5e73
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-60000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f48f11bcab6ded7ab3824136968cc2d71881e86a72201ae494a0871898304629
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_shared_only/checkpoint/model-80000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b672ab874206560b8f88bc8b1bfb13afa75f70f1d2721170cd2a5da94371b769
|
| 3 |
+
size 8140483620
|