Commit
·
563d6f7
1
Parent(s):
4292bd5
Upload part 22
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +40 -0
- checkpoint_1007000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.encoder.layers_7.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_7.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_10.pre_self_attention_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_10.pre_self_attention_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_13.pre_self_attention_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_13.pre_self_attention_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/.zarray.__tmp4147714852658976211.~1663960300471661~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/.zarray.__tmp9555357449403213209.~1663960300683715~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/.zarray.__tmp11486611230450486738.~1663960300987305~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/.zarray.__tmp1218504712848670488.~1663960300551362~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/.zarray.__tmp12210499250334949315.~1663960300551781~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/.zarray.__tmp13342057397051974412.~1663960300730328~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/.zarray.__tmp13871929988687534989.~1663960300864701~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/.zarray.__tmp16009143535501472492.~1663960301024973~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/.zarray.__tmp6305613955940868417.~1663960300685131~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/.zarray.__tmp1396208861180522139.~1663960300554631~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/.zarray.__tmp11929326860362079676.~1663960300500846~ +1 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/.zarray.__tmp1245922900176289008.~1663960300384432~ +1 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/.zarray.__tmp1577452788764155663.~1663960300309792~ +1 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/.zarray.__tmp1962892791003305179.~1663960300425311~ +1 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/.zarray.__tmp4960023367428288268.~1663960300504905~ +1 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/.zarray.__tmp7760782348285584253.~1663960300777117~ +1 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/.zarray.__tmp9690779028244793549.~1663960300501480~ +1 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/0.0 +3 -0
.gitattributes
CHANGED
|
@@ -1157,3 +1157,43 @@ checkpoint_1007000/target.decoder.layers_19.mlp.wi_1.kernel/0.2 filter=lfs diff=
|
|
| 1157 |
checkpoint_1007000/target.decoder.layers_19.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1158 |
checkpoint_1007000/target.encoder.layers_14.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1159 |
checkpoint_1007000/target.encoder.layers_14.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1157 |
checkpoint_1007000/target.decoder.layers_19.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1158 |
checkpoint_1007000/target.encoder.layers_14.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1159 |
checkpoint_1007000/target.encoder.layers_14.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 1160 |
+
checkpoint_1007000/target.encoder.layers_14.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1161 |
+
checkpoint_1007000/target.encoder.layers_14.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 1162 |
+
checkpoint_1007000/target.encoder.layers_14.attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 1163 |
+
checkpoint_1007000/target.encoder.layers_14.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 1164 |
+
checkpoint_1007000/target.encoder.layers_14.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 1165 |
+
checkpoint_1007000/target.encoder.layers_14.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1166 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 1167 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 1168 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 1169 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1170 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 1171 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 1172 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 1173 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 1174 |
+
checkpoint_1007000/target.encoder.layers_17.attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 1175 |
+
checkpoint_1007000/target.encoder.layers_17.attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 1176 |
+
checkpoint_1007000/target.encoder.layers_17.attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 1177 |
+
checkpoint_1007000/target.encoder.layers_17.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1178 |
+
checkpoint_1007000/target.encoder.layers_17.attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 1179 |
+
checkpoint_1007000/target.encoder.layers_17.attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 1180 |
+
checkpoint_1007000/target.encoder.layers_17.attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 1181 |
+
checkpoint_1007000/target.encoder.layers_17.attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 1182 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1183 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 1184 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1185 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 1186 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 1187 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 1188 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 1189 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1190 |
+
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1191 |
+
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 1192 |
+
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1193 |
+
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 1194 |
+
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 1195 |
+
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 1196 |
+
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 1197 |
+
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1198 |
+
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1199 |
+
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/0
ADDED
|
Binary file (14.8 kB). View file
|
|
|
checkpoint_1007000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/0
ADDED
|
Binary file (15 kB). View file
|
|
|
checkpoint_1007000/state.param_states.encoder.layers_7.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_7.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (15.3 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_10.pre_self_attention_layer_norm.scale/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.pre_self_attention_layer_norm.scale/0
ADDED
|
Binary file (14.7 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_13.pre_self_attention_layer_norm.scale/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.pre_self_attention_layer_norm.scale/0
ADDED
|
Binary file (14.7 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/.zarray.__tmp4147714852658976211.~1663960300471661~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/.zarray.__tmp9555357449403213209.~1663960300683715~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ac74bb1e4064f5bc5e2545215e89b6ca1e92172654308fc4541ae0599d91a8a1
|
| 3 |
+
size 7830871
|
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cff347f263e2cfad4eecf8ad8ada1c0261abf02d006634d66c60a6997f06a85d
|
| 3 |
+
size 7805561
|
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/.zarray.__tmp11486611230450486738.~1663960300987305~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/.zarray.__tmp1218504712848670488.~1663960300551362~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/.zarray.__tmp12210499250334949315.~1663960300551781~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/.zarray.__tmp13342057397051974412.~1663960300730328~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/.zarray.__tmp13871929988687534989.~1663960300864701~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/.zarray.__tmp16009143535501472492.~1663960301024973~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/.zarray.__tmp6305613955940868417.~1663960300685131~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:95f9757546bc379e76a6fe51ee02ecf5d472ec4988f6b69be923e494cece374b
|
| 3 |
+
size 7819544
|
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8187ebf2d4d7656cc55fefdfbc2ff05ec3b4007344c413c7bd7d5384e2499b90
|
| 3 |
+
size 7832115
|
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b7c93415721e5e736588fc6d57197e484f433cae527a231eb5dff9df62eca80a
|
| 3 |
+
size 7826719
|
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:91b70bfa665d07a2aa8cb4d3ba1b37f650f42bc325115ac913b94c04b5d17c90
|
| 3 |
+
size 7820634
|
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9f5b2c1ffdad75929d14a5050def62c5173406acf817bfe004c8117083a55696
|
| 3 |
+
size 7820443
|
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2fdfc5940799378b89cbf621052756ce14bb156796020856bad475295a5f8bca
|
| 3 |
+
size 7824835
|
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:12658d96a1d5399806fb8cba10b668a15eb6d747607620157e1fc318217ccb60
|
| 3 |
+
size 7820163
|
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:269d674efbf99ddb7e7b0a181bd7e83360f3747eefad8da956ed7bfb7544f4b9
|
| 3 |
+
size 7818451
|
checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/.zarray.__tmp1396208861180522139.~1663960300554631~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:33899193e9fbfadc927f4383631b298455622b45cb4d4d43dc82735168309245
|
| 3 |
+
size 19535000
|
checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:480b24b2ac2707cfc36a4bbc297ee13bb75f3acebd243faec95efd11aa3b9405
|
| 3 |
+
size 19535430
|
checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8902ba44b86bc3b24fe339bee2c5afff16685d7288668ea29c01893d8d4b9b23
|
| 3 |
+
size 19535014
|
checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1b58ea61bbf3e9b6f583b7fc9d7ebdbc3dd07643ba8ec13a86b94f0e7b695534
|
| 3 |
+
size 19535064
|
checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/4.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a12369583b11afbfeb6cc9e4abbba0401f1d58fe5d57cc069051fa6024b9a88d
|
| 3 |
+
size 19535530
|
checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/5.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:85d6cbcdba4272ff940f4d8b7f0897277c8631950973bdf44f86ba23f6cf9d5f
|
| 3 |
+
size 19535689
|
checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/6.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4764a6a7d63c7ef88f11fa11030a7353044965c5fdfbd6eb540d588499bf6c17
|
| 3 |
+
size 19535492
|
checkpoint_1007000/target.decoder.layers_20.mlp.wo.kernel/7.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:35480bd853f075cb83ef38a238d3f5920a0e41cda34c8b79d84462f5ee4c206d
|
| 3 |
+
size 19534696
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/.zarray.__tmp11929326860362079676.~1663960300500846~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/.zarray.__tmp1245922900176289008.~1663960300384432~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/.zarray.__tmp1577452788764155663.~1663960300309792~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/.zarray.__tmp1962892791003305179.~1663960300425311~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/.zarray.__tmp4960023367428288268.~1663960300504905~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/.zarray.__tmp7760782348285584253.~1663960300777117~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/.zarray.__tmp9690779028244793549.~1663960300501480~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_4.mlp.wi_0.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ecbe367dc69840807639175e8c7fe7348b09e7dcd9a7e483f8418aa4125f61e3
|
| 3 |
+
size 19542845
|