Commit
·
fbf19ae
1
Parent(s):
e9f3b02
Upload part 32
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +49 -0
- checkpoint_1007000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.encoder.layers_10.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_10.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.encoder.layers_20.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_20.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp12293737374257612135.~1663960300308679~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp13388884657439360929.~1663960300683677~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp14673227939187635924.~1663960300887724~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp4237423661826810814.~1663960300070821~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp7868827516398815433.~1663960300016688~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/.zarray.__tmp15512240270656656792.~1663960300936511~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/.zarray.__tmp16922826167621782989.~1663960300221043~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/.zarray.__tmp3472997630134773701.~1663960300865030~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/.zarray.__tmp4662274339282745602.~1663960300731396~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/.zarray.__tmp4823290627812450517.~1663960300228855~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/.zarray.__tmp4947456744926543253.~1663960300308483~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/.zarray.__tmp6560988738775241257.~1663960300551733~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.out.kernel/.zarray.__tmp5307870074451922335.~1663960300497948~ +1 -0
- checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.out.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.out.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.out.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.out.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.out.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.out.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.query.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.query.kernel/.zarray.__tmp10331289727090379592.~1663960300826103~ +1 -0
- checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.query.kernel/.zarray.__tmp12409451780220750098.~1663960300554266~ +1 -0
- checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.query.kernel/.zarray.__tmp13890749968340131481.~1663960301027457~ +1 -0
- checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.query.kernel/.zarray.__tmp13978340362905456387.~1663960300724952~ +1 -0
- checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.query.kernel/.zarray.__tmp16263027495398350293.~1663960300423032~ +1 -0
.gitattributes
CHANGED
|
@@ -1648,3 +1648,52 @@ checkpoint_1007000/target.encoder.layers_10.attention.out.kernel/1.0 filter=lfs
|
|
| 1648 |
checkpoint_1007000/target.encoder.layers_10.attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 1649 |
checkpoint_1007000/target.encoder.layers_10.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1650 |
checkpoint_1007000/target.encoder.layers_10.attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1648 |
checkpoint_1007000/target.encoder.layers_10.attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 1649 |
checkpoint_1007000/target.encoder.layers_10.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1650 |
checkpoint_1007000/target.encoder.layers_10.attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 1651 |
+
checkpoint_1007000/target.encoder.layers_10.attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 1652 |
+
checkpoint_1007000/target.encoder.layers_10.attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 1653 |
+
checkpoint_1007000/target.encoder.layers_10.attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 1654 |
+
checkpoint_1007000/target.encoder.layers_16.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1655 |
+
checkpoint_1007000/target.encoder.layers_16.attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 1656 |
+
checkpoint_1007000/target.encoder.layers_16.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1657 |
+
checkpoint_1007000/target.encoder.layers_16.attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 1658 |
+
checkpoint_1007000/target.encoder.layers_16.attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 1659 |
+
checkpoint_1007000/target.encoder.layers_16.attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 1660 |
+
checkpoint_1007000/target.encoder.layers_16.attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 1661 |
+
checkpoint_1007000/target.encoder.layers_16.attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1662 |
+
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 1663 |
+
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 1664 |
+
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 1665 |
+
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1666 |
+
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 1667 |
+
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 1668 |
+
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 1669 |
+
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 1670 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1671 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 1672 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1673 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 1674 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 1675 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 1676 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 1677 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1678 |
+
checkpoint_1007000/target.encoder.layers_6.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 1679 |
+
checkpoint_1007000/target.encoder.layers_6.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 1680 |
+
checkpoint_1007000/target.encoder.layers_6.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 1681 |
+
checkpoint_1007000/target.encoder.layers_6.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1682 |
+
checkpoint_1007000/target.encoder.layers_6.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 1683 |
+
checkpoint_1007000/target.encoder.layers_6.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 1684 |
+
checkpoint_1007000/target.encoder.layers_6.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 1685 |
+
checkpoint_1007000/target.encoder.layers_6.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 1686 |
+
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1687 |
+
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 1688 |
+
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1689 |
+
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 1690 |
+
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 1691 |
+
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 1692 |
+
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 1693 |
+
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1694 |
+
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 1695 |
+
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 1696 |
+
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 1697 |
+
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1698 |
+
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 1699 |
+
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0
ADDED
|
Binary file (15.1 kB). View file
|
|
|
checkpoint_1007000/state.param_states.encoder.layers_10.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_10.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (15.3 kB). View file
|
|
|
checkpoint_1007000/state.param_states.encoder.layers_20.pre_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_20.pre_attention_layer_norm.scale.v/0
ADDED
|
Binary file (14.8 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp12293737374257612135.~1663960300308679~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp13388884657439360929.~1663960300683677~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp14673227939187635924.~1663960300887724~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp4237423661826810814.~1663960300070821~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp7868827516398815433.~1663960300016688~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2b2d1258d767b05decf96f6c34e086431c7e19a32302900d0bf2ff9b2ad66f59
|
| 3 |
+
size 19545749
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a9b0b6fa0f690f26b797e2174b1621d69114bc916aa6d6dc84beed6393ed5dcd
|
| 3 |
+
size 19549072
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e88ab51df383ab917536359318fe3578460fe7cb05fc58345765b534a8ad2a02
|
| 3 |
+
size 19547695
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:256cb825c1987217b4391dd1f9b5385a91c15cf23147cf408a4fb16028f56978
|
| 3 |
+
size 19547035
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:47fa1715cbca0649f2d9eb46e64d9956ef62c877b49470d8798a6bb339cec689
|
| 3 |
+
size 19548648
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ed60f3351e6a0c7c6e1628ad20a0afe9c43795ef92c606303461a506a95e94d7
|
| 3 |
+
size 19546909
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:90d26eb8c28ca3252d16fd9960c405eee179c74f4ca371ab8be46f5504f3624a
|
| 3 |
+
size 19546531
|
checkpoint_1007000/target.decoder.layers_1.mlp.wi_0.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:463b9c7872ad9ae82d74e96340a5edcaf9f5a0141d003f19e667c67103b5f8b2
|
| 3 |
+
size 19545823
|
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/.zarray.__tmp15512240270656656792.~1663960300936511~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/.zarray.__tmp16922826167621782989.~1663960300221043~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/.zarray.__tmp3472997630134773701.~1663960300865030~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/.zarray.__tmp4662274339282745602.~1663960300731396~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/.zarray.__tmp4823290627812450517.~1663960300228855~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/.zarray.__tmp4947456744926543253.~1663960300308483~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/.zarray.__tmp6560988738775241257.~1663960300551733~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca84f49e15b1bd9e0086ecb596b1a3f002b6c97d62b0f6e40b39c59a2e20d3ed
|
| 3 |
+
size 19531628
|
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:278cf6e05a0c7ddab61faaabfc482ffada97d5cfb4797541e91183f173006bfc
|
| 3 |
+
size 19532132
|
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b84d017ab0f0c46e2e856aceca66358020a8522952809f7aa8e859c16983f893
|
| 3 |
+
size 19532831
|
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6874b076aed566fc87d0b5bcd5275eec9af6add03313e8c4d7aceb16e2a38e92
|
| 3 |
+
size 19532480
|
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/4.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a9fa9ef3962d7d84d93476e9b05119f0aa8dbc8afa18ae6402718d466c3cdb0
|
| 3 |
+
size 19531708
|
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/5.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0070cbcdd8dddd9f846caa44e0d133272a352d5146e03e5c0baebbf381b81236
|
| 3 |
+
size 19532952
|
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/6.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f8cc984a6d2655810c24b682f24af6c8017c581b265f4f77317bd820ac7be9f7
|
| 3 |
+
size 19531855
|
checkpoint_1007000/target.decoder.layers_18.mlp.wo.kernel/7.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2854551cd722e373fa568d1489cd7fd3e6805ec7f266b12d1849bda8a82edecb
|
| 3 |
+
size 19531650
|
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.out.kernel/.zarray.__tmp5307870074451922335.~1663960300497948~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.out.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f93e3de76e30aa9775203344220427cfbb4c42f557020bc71e3da969732305a0
|
| 3 |
+
size 7822496
|
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.out.kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a893b741ae3bd8252c2c42281d1f05150e05bb8d295f71e3565bdff8209bacfa
|
| 3 |
+
size 7820977
|
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.out.kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6012dd6d45b67926e0fc2179500b13628f0bdcaaaf6db19f55137ccfcd184d8d
|
| 3 |
+
size 7821915
|
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.out.kernel/5.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ed80ba03d04d7084bd97c8bd53305bd18dbdc74d94f347757f4d8486d1dd4bb
|
| 3 |
+
size 7822007
|
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.out.kernel/6.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ae8ff296397aa6a248d747ac7da43759046149925df935e233965a462599a8d1
|
| 3 |
+
size 7820408
|
checkpoint_1007000/target.decoder.layers_6.encoder_decoder_attention.out.kernel/7.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1e326151e6d1c5fcecf1131315ce080d22067c027bd4e312251564230d5d6c56
|
| 3 |
+
size 7821443
|
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.query.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.query.kernel/.zarray.__tmp10331289727090379592.~1663960300826103~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.query.kernel/.zarray.__tmp12409451780220750098.~1663960300554266~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.query.kernel/.zarray.__tmp13890749968340131481.~1663960301027457~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.query.kernel/.zarray.__tmp13978340362905456387.~1663960300724952~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.query.kernel/.zarray.__tmp16263027495398350293.~1663960300423032~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|