Commit
·
6ccb29c
1
Parent(s):
4f1fdb7
Upload part 27
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +51 -0
- checkpoint_1007000/state.param_states.decoder.layers_22.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_22.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.decoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_6.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/.zarray.__tmp15354685998123179540.~1663960300495111~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/.zarray.__tmp16170028922246737233.~1663960300385482~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/.zarray.__tmp17288873837878801007.~1663960300549708~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/.zarray.__tmp577301364692537855.~1663960300632117~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/.zarray.__tmp7283641247067179797.~1663960300683760~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/.zarray.__tmp896724262472385512.~1663960300986807~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/.zarray.__tmp9312776218164125947.~1663960300940889~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/.zarray.__tmp14493264947335317128.~1663960300546923~ +1 -0
- checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/.zarray.__tmp740157777808966451.~1663960300351573~ +1 -0
- checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/.zarray.__tmp922837810789523104.~1663960300865802~ +1 -0
- checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/.zarray.__tmp10325228294865560130.~1663960300941375~ +1 -0
- checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/.zarray.__tmp11198960157786008892.~1663960300546819~ +1 -0
- checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/.zarray.__tmp1273332649516111222.~1663960300778415~ +1 -0
- checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/.zarray.__tmp15121084618146118760.~1663960300548752~ +1 -0
- checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/.zarray.__tmp15475646191937215619.~1663960300384575~ +1 -0
- checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/.zarray.__tmp3233461844801345740.~1663960300421881~ +1 -0
- checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/.zarray.__tmp6060468192151190772.~1663960300686175~ +1 -0
- checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.7 +3 -0
- checkpoint_1007000/target.encoder.layers_10.attention.value.kernel/.zarray +1 -0
- checkpoint_1007000/target.encoder.layers_10.attention.value.kernel/.zarray.__tmp12534806932945011317.~1663960300688775~ +1 -0
.gitattributes
CHANGED
|
@@ -1391,3 +1391,54 @@ checkpoint_1007000/target.encoder.layers_11.mlp.wo.kernel/6.0 filter=lfs diff=lf
|
|
| 1391 |
checkpoint_1007000/target.encoder.layers_11.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 1392 |
checkpoint_1007000/target.encoder.layers_11.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 1393 |
checkpoint_1007000/target.encoder.layers_11.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1391 |
checkpoint_1007000/target.encoder.layers_11.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 1392 |
checkpoint_1007000/target.encoder.layers_11.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 1393 |
checkpoint_1007000/target.encoder.layers_11.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1394 |
+
checkpoint_1007000/target.encoder.layers_11.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 1395 |
+
checkpoint_1007000/target.encoder.layers_11.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 1396 |
+
checkpoint_1007000/target.encoder.layers_11.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 1397 |
+
checkpoint_1007000/target.encoder.layers_11.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 1398 |
+
checkpoint_1007000/target.encoder.layers_16.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1399 |
+
checkpoint_1007000/target.encoder.layers_16.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 1400 |
+
checkpoint_1007000/target.encoder.layers_16.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1401 |
+
checkpoint_1007000/target.encoder.layers_16.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 1402 |
+
checkpoint_1007000/target.encoder.layers_16.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 1403 |
+
checkpoint_1007000/target.encoder.layers_16.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 1404 |
+
checkpoint_1007000/target.encoder.layers_16.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 1405 |
+
checkpoint_1007000/target.encoder.layers_16.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1406 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 1407 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 1408 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 1409 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1410 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 1411 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 1412 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 1413 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 1414 |
+
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1415 |
+
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 1416 |
+
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1417 |
+
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 1418 |
+
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 1419 |
+
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 1420 |
+
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 1421 |
+
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1422 |
+
checkpoint_1007000/target.encoder.layers_11.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1423 |
+
checkpoint_1007000/target.encoder.layers_11.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 1424 |
+
checkpoint_1007000/target.encoder.layers_11.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1425 |
+
checkpoint_1007000/target.encoder.layers_11.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 1426 |
+
checkpoint_1007000/target.encoder.layers_11.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 1427 |
+
checkpoint_1007000/target.encoder.layers_11.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 1428 |
+
checkpoint_1007000/target.encoder.layers_11.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 1429 |
+
checkpoint_1007000/target.encoder.layers_11.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1430 |
+
checkpoint_1007000/target.encoder.layers_10.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1431 |
+
checkpoint_1007000/target.encoder.layers_10.attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 1432 |
+
checkpoint_1007000/target.encoder.layers_10.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1433 |
+
checkpoint_1007000/target.encoder.layers_10.attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 1434 |
+
checkpoint_1007000/target.encoder.layers_10.attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 1435 |
+
checkpoint_1007000/target.encoder.layers_10.attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 1436 |
+
checkpoint_1007000/target.encoder.layers_10.attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 1437 |
+
checkpoint_1007000/target.encoder.layers_10.attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1438 |
+
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 1439 |
+
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 1440 |
+
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 1441 |
+
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1442 |
+
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 1443 |
+
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 1444 |
+
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_22.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_22.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (14.3 kB). View file
|
|
|
checkpoint_1007000/state.param_states.decoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_6.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (14.8 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/.zarray.__tmp15354685998123179540.~1663960300495111~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/.zarray.__tmp16170028922246737233.~1663960300385482~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/.zarray.__tmp17288873837878801007.~1663960300549708~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/.zarray.__tmp577301364692537855.~1663960300632117~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/.zarray.__tmp7283641247067179797.~1663960300683760~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/.zarray.__tmp896724262472385512.~1663960300986807~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/.zarray.__tmp9312776218164125947.~1663960300940889~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7c4ffaf1bd9dc95084bed6ab73f23822a0ac282e55461869fe449385432f55b6
|
| 3 |
+
size 7802033
|
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f46cf1324687e56108d5f2a5ccfeee5fb82b6be0895b6cb76caa58ec2a3542f2
|
| 3 |
+
size 7808083
|
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3d0f15702032b0808e538f339db33a9d93d3a3da4702a28cb601e077ea8591e4
|
| 3 |
+
size 7804878
|
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:91ae3e7990804ac570c14fd6d989a4edcd789797c11fac5b97007495ebabde2c
|
| 3 |
+
size 7800056
|
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/4.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4998a8e7518db32a6e52ec551def2fce5781f9ef9dd9064d9ffb7fd0ba6da8a4
|
| 3 |
+
size 7809293
|
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/5.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3f82e906784b49e4a334d8ee6a229c21a6ba00d3446e128f06440b35c0a0112b
|
| 3 |
+
size 7805952
|
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/6.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e52bbfbb807d56369de45cdd5e1b425cf3795be4db5897ef01e076fa908e7c70
|
| 3 |
+
size 7799523
|
checkpoint_1007000/target.decoder.layers_17.self_attention.out.kernel/7.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:28e1d6a140b616eb6f65f41644c67d0b503f38fa20bb7afda7086c5b7f92e088
|
| 3 |
+
size 7804405
|
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/.zarray.__tmp14493264947335317128.~1663960300546923~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/.zarray.__tmp740157777808966451.~1663960300351573~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/.zarray.__tmp922837810789523104.~1663960300865802~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8832c8ba44b539481f0251a9cdaac1c51d59e87a02a3ef94f6186e66453f5a64
|
| 3 |
+
size 7800716
|
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bb3ec5e7c96a71168f3b0581c0adb682486fa329728bb95c09cb8da5ffef2be8
|
| 3 |
+
size 7801871
|
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b6e804e692c942f8046103e10829501c1406078d82ec40161615b0ebdfb6964c
|
| 3 |
+
size 7799099
|
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f526f17ee9354fc37548ac58c666c5fad45546f0f9eaee3973f5bc9436cff7e1
|
| 3 |
+
size 7802121
|
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/5.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:277dd2da62e68b79598688b85cc6f0cc923a4a26bf3095350552e3f0dab6226d
|
| 3 |
+
size 7802930
|
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/6.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a071bb0f38dbc1e28e52247aa6b6d38ef501935e5455626beda95be7880bd910
|
| 3 |
+
size 7803056
|
checkpoint_1007000/target.decoder.layers_19.encoder_decoder_attention.out.kernel/7.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a2a4ac1cc69caa671ddd70d2743ce43869bbe1043ebc98eda58fc5a0ddc7c8e9
|
| 3 |
+
size 7801928
|
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/.zarray.__tmp10325228294865560130.~1663960300941375~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/.zarray.__tmp11198960157786008892.~1663960300546819~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/.zarray.__tmp1273332649516111222.~1663960300778415~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/.zarray.__tmp15121084618146118760.~1663960300548752~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/.zarray.__tmp15475646191937215619.~1663960300384575~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/.zarray.__tmp3233461844801345740.~1663960300421881~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/.zarray.__tmp6060468192151190772.~1663960300686175~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3023aa7df4276d602d908726bfa713b3c930e58ff2af700e16b8d3ceed6429cb
|
| 3 |
+
size 19540101
|
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b287f6c55f5cdb1fd02568849a05806baf5c182fffb1bedf7927808f6c803e91
|
| 3 |
+
size 19540453
|
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0f93283f1ce8a735987888eb089b20e47e83e02fe638c357f9e709e711213ebe
|
| 3 |
+
size 19540390
|
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d5ade6ac36c93d8ed9fb4e1615b9e28d25c653f97eb609a016326afc9edbc097
|
| 3 |
+
size 19537245
|
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:077c6ad75e7bb83b246e619e36fc06c1e301bb0bbc84abb0e0078ee225839152
|
| 3 |
+
size 19539587
|
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1b23853338102374d509a204c1fc3f2b80e4621f3870cec280a41cde779558c1
|
| 3 |
+
size 19539668
|
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:08a5585fdf1ad7f912df2eea9500e12feb918a9769122dd8002633ac0a380a9a
|
| 3 |
+
size 19538894
|
checkpoint_1007000/target.decoder.layers_7.mlp.wi_0.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d1d3851f45e41f8825e69b2a04ca8a079705ee46c240467b492ae7271e6dc73b
|
| 3 |
+
size 19540452
|
checkpoint_1007000/target.encoder.layers_10.attention.value.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_10.attention.value.kernel/.zarray.__tmp12534806932945011317.~1663960300688775~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|