Upload folder using huggingface_hub
#271
by
DavidNguyen
- opened
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-100000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-120000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-140000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-160000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-180000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-20000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-200000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-220000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-240000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-260000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-280000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-300000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-320000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-340000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-360000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-380000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-40000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-400000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-60000.pth +3 -0
- Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-80000.pth +3 -0
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-100000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:16a95f41d17724716f016acf69cd7f609baeaecad285d68ed152ca01de64ccb9
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-120000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9dff30dbb337163b98242e72d8254bef40ad481e4b61351ea23014efce006b18
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-140000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cb7e0ed218a280d6fd2090beb9a0fe6da718674bc817f45551eb51839c140f1b
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-160000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:26c8589a2a14572f95f2a577ed90f5ad5c0affcbfe3eb7c3f173b66f45108923
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-180000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b51ed0f450bf291459972f135d6d40eaccf1ce81428dfd274069377dd87225fd
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-20000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2f4f73fd84654b5d8acbea670c9ea1ea04f179d4f3b3696ee5d97157531cff93
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-200000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d14067107c384ad289a959b927228c1c2286d5e808bd097661ae6f3ed6b2f99c
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-220000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:158b8e1b34ae5207399edff97036112da88dc05e1cb4fe08c155926de6cdd031
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-240000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a8f3fae86e0e5b42f01f2b6d4d68481061e6b2a33bf0a86d1af0ea10e27a41d
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-260000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:af1a3891493c8b108edf9e32a4ccc8887adcb959917a7a064faca17a228451e4
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-280000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a2199d301d5f866055d0cb3ef07276bd99db1fdcf8ab9288b5fb42f8889fa889
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-300000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0bc0eedb5e0aca9bd80e70cb09c0823fda8829aada3fbcf9fe0f4cdcd2a1253d
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-320000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:759522c022e6ed5cccc3b8e88e20d94e8c3c26917872c7f4e054e1c7a22b33dc
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-340000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3e29e3e26f9b9b9dd1b2d8a415b9796ed5522662d059f2cef4c209bd37b847b9
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-360000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3cc0e7c67f6b91da2fa58c19699da1befffc0a3e9f22a3972589e9fa5fb9e583
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-380000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b56c81eed9b7c8ab2fd68238f7a0cd7aa2fc2115ff811f7718f199121b465be8
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-40000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:84d2016c109626b2af0fa338649b7c54cc751b51064ffb5d83e41c93dd934b9c
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-400000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3d4ac3770a0964bb9e6fb8f75761fe40038b421da3db8517c2d015f523985d63
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-60000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:91b5dcaab5e7785c28ddbde62bb123ce88b883bcf58ccab5ac4a8f83e9aa1c6d
|
| 3 |
+
size 8140483620
|
Pretrain_language_model/save_final/slimpajama_moe_no_attmoe_660M_standardlb_deepseek_sigmoidonly_v2/checkpoint/model-80000.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6c4299a6c97cbbb42d99fe395774aade63d17b5629a5ac5a0fe1e8824f5512af
|
| 3 |
+
size 8140483620
|