4b892c845d1e773a514c28d88e36caa762e050f2929936953b8e47aed369f25d
Browse files
sft/1M3/Full_smoe_tcmoe/checkpoint-13786/model-00003-of-00003.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:146a99928674488c4a8958c19a9e6cf490736a3b99eacd2a4c77cd63d10fa95f
|
| 3 |
+
size 248971200
|
sft/1M3/Full_smoe_tcmoe/checkpoint-13786/model.safetensors.index.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"metadata": {
|
| 3 |
-
"total_size":
|
| 4 |
},
|
| 5 |
"weight_map": {
|
| 6 |
"lm_head.weight": "model-00003-of-00003.safetensors",
|
|
|
|
| 1 |
{
|
| 2 |
"metadata": {
|
| 3 |
+
"total_size": 10207220352
|
| 4 |
},
|
| 5 |
"weight_map": {
|
| 6 |
"lm_head.weight": "model-00003-of-00003.safetensors",
|
sft/1M3/Full_smoe_tcmoe/checkpoint-13786/trainer_state.json
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
sft/1M3/Full_smoe_tcmoe/checkpoint-13786/training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 7992
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:88a0753fdff97eef6a658f2b2cf4c8afea9a83a6ca1601c10ad020270039b677
|
| 3 |
size 7992
|