Upload 114 files
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- model/backbone.pt +1 -1
- model/config.json +2 -2
- model/layer_01_moe_expert_001/model_001.pt +1 -1
- model/layer_01_moe_expert_001/model_002.pt +1 -1
- model/layer_01_moe_expert_001/model_003.pt +1 -1
- model/layer_01_moe_expert_001/model_004.pt +1 -1
- model/layer_01_moe_expert_001/model_005.pt +1 -1
- model/layer_01_moe_expert_001/model_006.pt +1 -1
- model/layer_01_moe_expert_001/model_007.pt +1 -1
- model/layer_01_moe_expert_001/model_008.pt +1 -1
- model/layer_01_moe_expert_002/model_001.pt +1 -1
- model/layer_01_moe_expert_002/model_002.pt +1 -1
- model/layer_01_moe_expert_002/model_003.pt +1 -1
- model/layer_01_moe_expert_002/model_004.pt +1 -1
- model/layer_01_moe_expert_002/model_005.pt +1 -1
- model/layer_01_moe_expert_002/model_006.pt +1 -1
- model/layer_01_moe_expert_002/model_007.pt +1 -1
- model/layer_01_moe_expert_002/model_008.pt +1 -1
- model/layer_01_moe_expert_003/model_001.pt +1 -1
- model/layer_01_moe_expert_003/model_002.pt +1 -1
- model/layer_01_moe_expert_003/model_003.pt +1 -1
- model/layer_01_moe_expert_003/model_004.pt +1 -1
- model/layer_01_moe_expert_003/model_005.pt +1 -1
- model/layer_01_moe_expert_003/model_006.pt +1 -1
- model/layer_01_moe_expert_003/model_007.pt +1 -1
- model/layer_01_moe_expert_003/model_008.pt +1 -1
- model/layer_01_moe_expert_004/model_001.pt +1 -1
- model/layer_01_moe_expert_004/model_002.pt +1 -1
- model/layer_01_moe_expert_004/model_003.pt +1 -1
- model/layer_01_moe_expert_004/model_004.pt +1 -1
- model/layer_01_moe_expert_004/model_005.pt +1 -1
- model/layer_01_moe_expert_004/model_006.pt +1 -1
- model/layer_01_moe_expert_004/model_007.pt +1 -1
- model/layer_01_moe_expert_004/model_008.pt +1 -1
- model/layer_01_moe_expert_005/model_001.pt +1 -1
- model/layer_01_moe_expert_005/model_002.pt +1 -1
- model/layer_01_moe_expert_005/model_003.pt +1 -1
- model/layer_01_moe_expert_005/model_004.pt +1 -1
- model/layer_01_moe_expert_005/model_005.pt +1 -1
- model/layer_01_moe_expert_005/model_006.pt +1 -1
- model/layer_01_moe_expert_005/model_007.pt +1 -1
- model/layer_01_moe_expert_005/model_008.pt +1 -1
- model/layer_01_moe_expert_006/model_001.pt +1 -1
- model/layer_01_moe_expert_006/model_002.pt +1 -1
- model/layer_01_moe_expert_006/model_003.pt +1 -1
- model/layer_01_moe_expert_006/model_004.pt +1 -1
- model/layer_01_moe_expert_006/model_005.pt +1 -1
- model/layer_01_moe_expert_006/model_006.pt +1 -1
- model/layer_01_moe_expert_006/model_007.pt +1 -1
- model/layer_01_moe_expert_006/model_008.pt +1 -1
model/backbone.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2322241
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:259a3fb2b1b104ba59167966c9a8d29264cf596ec2a510c1eb75db719ab453d2
|
| 3 |
size 2322241
|
model/config.json
CHANGED
|
@@ -8,7 +8,7 @@
|
|
| 8 |
"num_moes": 6,
|
| 9 |
"num_experts": 8,
|
| 10 |
"batch_size": 32,
|
| 11 |
-
"max_iters":
|
| 12 |
"eval_interval": 50,
|
| 13 |
"eval_iters": 20,
|
| 14 |
"lr": 0.0003,
|
|
@@ -16,7 +16,7 @@
|
|
| 16 |
"model_dir": "model"
|
| 17 |
},
|
| 18 |
"vocab_size": 67,
|
| 19 |
-
"step":
|
| 20 |
"stoi": {
|
| 21 |
"\n": 0,
|
| 22 |
" ": 1,
|
|
|
|
| 8 |
"num_moes": 6,
|
| 9 |
"num_experts": 8,
|
| 10 |
"batch_size": 32,
|
| 11 |
+
"max_iters": 750,
|
| 12 |
"eval_interval": 50,
|
| 13 |
"eval_iters": 20,
|
| 14 |
"lr": 0.0003,
|
|
|
|
| 16 |
"model_dir": "model"
|
| 17 |
},
|
| 18 |
"vocab_size": 67,
|
| 19 |
+
"step": 750,
|
| 20 |
"stoi": {
|
| 21 |
"\n": 0,
|
| 22 |
" ": 1,
|
model/layer_01_moe_expert_001/model_001.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d331e61f34324c69e428c16fc9ee88d55a02dbca245fcefcddc1141497024216
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_001/model_002.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:68e41d48120d08dfe452d4890f9955164694f157c1281b9126d30e98a0a7358c
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_001/model_003.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:76c268dd46f06d1b4de1545e4d727557774a29a80f997df47d561df7118c5bf8
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_001/model_004.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a0ff3eb8ba74414ad9c893e710b8eeb92d9195a8f543e1ca7060e99c0075b179
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_001/model_005.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:04817af0e04f4f59e8fdfa817f6b49d5422864ae51f9bc721a403ebe42355bdc
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_001/model_006.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4955f67c754c75130c1201aa149672850a58ec707731ffb305bfcf134169216f
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_001/model_007.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:abb061b1569dff2519c137e6a385af1f0a778eb055ee19d7f4fc738d6af081b4
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_001/model_008.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4247a64ebf4aae15952c16063ced16028b53edd604d25f69b8e0589c7680c10e
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_002/model_001.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e30ce0dba6fc24ac29f3effeb2abc47220fb48cc600c6186060716e6c4a66cfe
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_002/model_002.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ce238a05def8b77bbeafd6bfaa4e1e322e75586a24e5c172bb5a249193fd82c6
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_002/model_003.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:264063cb9314f0241006af1ac88ad93a07b1cdc21a65426f620e295cf69b3257
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_002/model_004.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8bf276b975043d189a4442d81a4b7fd9ed1773a1cee95d5fc3dc8f7aa7c0d4b9
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_002/model_005.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a6108a1484e1b6081645a9bd3d08c714fc995d6b16542d92514e6b798cdee015
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_002/model_006.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:69691479777a31a9fa13495b8a0f0a38ef54543dd1357317807ea9786f6adbee
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_002/model_007.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7c736630477c0e5b8258bf10942669c1debb7659f2ff3053529bb1544d62a88a
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_002/model_008.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:69b61936fa6bd51eed48e5bc8208d60de00fafce2ea26bd5b4e036ccc3e73544
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_003/model_001.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b6b89c8f29f31b3656077763880677f9f2b7a0652b2b02665ed618801d75baac
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_003/model_002.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ecb884280c3a91970211c0a5fb39edac1a005f88b7800ba6cee329a60ccd2f4a
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_003/model_003.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d94bdbf562135dad80e6954057ac6a17d6063ba2d7e7a186ced39fd664328772
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_003/model_004.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6021452f61f0fe77801681d3b35d36ac4f55d404462408430d3d7f9759e23e5f
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_003/model_005.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c0c8a515ab32220092938cef85f4abc3103298a156ed4cecb30b05096689ea77
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_003/model_006.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1f19e695021a169a773d5739771885d81d9112c254c411681284193084748d57
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_003/model_007.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b252b2ada4cf7bd9efa466cbfdc42bef816d9ab43bb04fa162d4c6f07f265893
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_003/model_008.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:12bcdd010bda128ce95a9b681093d71d8ef3c3f01fe39c62a275e272f2f9609b
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_004/model_001.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b4c6432cfea3a8cea2eadbb00eec765fe526b3cc30a2d2c2ab5a12c196c35a78
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_004/model_002.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:90c56a2e58ce2b25741e79d2359388ed9a56d14e7159a281502a634b6f055f10
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_004/model_003.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3fc137366c28a7cc78351d894928d2333cb3aa67add8907b46a55cd05cffda7c
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_004/model_004.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:499bf113b3402b1aeea0c948b1a93553224c4bad99202d30557120da7d1e0429
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_004/model_005.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e7c9df94f6f2d0ce1c974ce060088c5c8ca0155e57b316097d9edb8d024c7f5a
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_004/model_006.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b28319093fc767085640399e094d644cfce7749904da89534b2871b1d8bc3d1c
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_004/model_007.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:940d83f85c919ebca82ba140383ea03f8b56e8ed1057164fd1d7cae218a01202
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_004/model_008.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:472d18529b163b9b1efbe48668bb0ed3248b08afa94a0f0d1ac8de8308e1b836
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_005/model_001.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86a329717886db069f9ede6e3b2acbf6cfc0d6e5ff581d938733d54bdf858819
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_005/model_002.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a2884a96b5bd13e824cc72e20e7b1666a925036615c1797be5b793a1252a1f9
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_005/model_003.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dc095250ea182b963168322dcfa0084508b5cb6f3f7e04e36d05fb2a6b8150d4
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_005/model_004.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a6f21f593a2f6b38af2167be6a8758d6371a7e641739e477baf2dab5572ee156
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_005/model_005.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a5de98a0e062fdcde825b0a8ed1693c67a3c7a966c210c64df3c048c724687dd
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_005/model_006.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c9d156c673921ac74b23e612a23117e1f4c910d3dcc74fd49e4701bfe47ac2a7
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_005/model_007.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:69a5996fcd83f6e1ad5991f315f22dcde351262bcb2da91c14d90a325f9ba657
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_005/model_008.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b9c6fe128f683d872272485bea9b6e54f97e95f14413220af199a11cf4601b68
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_006/model_001.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0892976c92e5009d868745c2a500f6672ae068e07a8342cc24f30bab347fd27a
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_006/model_002.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6545f429bc9d25acff7627cfb165ea2e539bd974d1b2a23c3bc5ebf93244fb2a
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_006/model_003.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:322eed71b1698aa9b972a8bf88643c72568d46036881cbe890575758a24a4ea1
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_006/model_004.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6e074baa45df4707bb3773489ab4e853085d0decd0b13667ee3975206450a4fb
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_006/model_005.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5ccf41f7559f50e8caa5a8f10cd6db4c5f531da7bec5b1e55707daee116a7d53
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_006/model_006.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b874e6f9e23ebb764bf9c582e30370fd81e45cc3a46233e7567893456e17467a
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_006/model_007.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e9b7eaa517662447828c2e8fa2a10d1e4018ac413aba92e708c98995b3bf9dec
|
| 3 |
size 2104881
|
model/layer_01_moe_expert_006/model_008.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2104881
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a6d9bad35fd0eb284e2326906895204f88ce19208957749256717a967b964036
|
| 3 |
size 2104881
|