Commit ·
dd782e0
1
Parent(s): 1153a1f
Upload part 17
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +50 -0
- checkpoint_1007000/target.decoder.layers_1.pre_mlp_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_1.pre_mlp_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/.zarray.__tmp12266758972892400602.~1663960300070885~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/.zarray.__tmp16783166927373231934.~1663960299677983~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/.zarray.__tmp2367932448935716136.~1663960299882250~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/.zarray.__tmp5206876151419477825.~1663960299959263~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/.zarray.__tmp9180771959993893236.~1663960300018140~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/.zarray.__tmp9622455220886004513.~1663960300178008~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/.zarray.__tmp10259164110253181884.~1663960300501998~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/.zarray.__tmp107405781971231021.~1663960300886228~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/.zarray.__tmp13096478522792831033.~1663960300545878~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/.zarray.__tmp13463644331749572668.~1663960300420504~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/.zarray.__tmp14299296042507200098.~1663960300500161~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/.zarray.__tmp15565572797164759058.~1663960300348146~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/.zarray.__tmp10677792200381937821.~1663960300730839~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/.zarray.__tmp14644581288504991737.~1663960300502666~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/.zarray.__tmp16166340234170811950.~1663960300862291~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/.zarray.__tmp3136584453132712714.~1663960300495902~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/.zarray.__tmp5626792347056672524.~1663960300468255~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/.zarray.__tmp7840518664900691065.~1663960300384009~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/.zarray.__tmp8455163617466929986.~1663960300548751~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_15.pre_cross_attention_layer_norm.scale/.zarray +1 -0
.gitattributes
CHANGED
|
@@ -851,3 +851,53 @@ checkpoint_1007000/target.encoder.layers_2.attention.out.kernel/7.0 filter=lfs d
|
|
| 851 |
checkpoint_1007000/target.encoder.layers_2.attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 852 |
checkpoint_1007000/target.encoder.layers_2.attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 853 |
checkpoint_1007000/target.encoder.layers_2.attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 851 |
checkpoint_1007000/target.encoder.layers_2.attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 852 |
checkpoint_1007000/target.encoder.layers_2.attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 853 |
checkpoint_1007000/target.encoder.layers_2.attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 854 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 855 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 856 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 857 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 858 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 859 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 860 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 861 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 862 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 863 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 864 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 865 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 866 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 867 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 868 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 869 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 870 |
+
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 871 |
+
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 872 |
+
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 873 |
+
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 874 |
+
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 875 |
+
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 876 |
+
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 877 |
+
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 878 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 879 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 880 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 881 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 882 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 883 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 884 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 885 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 886 |
+
checkpoint_1007000/target.decoder.layers_15.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 887 |
+
checkpoint_1007000/target.decoder.layers_15.self_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 888 |
+
checkpoint_1007000/target.decoder.layers_15.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 889 |
+
checkpoint_1007000/target.decoder.layers_15.self_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 890 |
+
checkpoint_1007000/target.decoder.layers_15.self_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 891 |
+
checkpoint_1007000/target.decoder.layers_15.self_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 892 |
+
checkpoint_1007000/target.decoder.layers_15.self_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 893 |
+
checkpoint_1007000/target.decoder.layers_15.self_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 894 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 895 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 896 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 897 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 898 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 899 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 900 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 901 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 902 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 903 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/target.decoder.layers_1.pre_mlp_layer_norm.scale/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.pre_mlp_layer_norm.scale/0
ADDED
|
Binary file (15 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/.zarray.__tmp12266758972892400602.~1663960300070885~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/.zarray.__tmp16783166927373231934.~1663960299677983~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/.zarray.__tmp2367932448935716136.~1663960299882250~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/.zarray.__tmp5206876151419477825.~1663960299959263~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/.zarray.__tmp9180771959993893236.~1663960300018140~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/.zarray.__tmp9622455220886004513.~1663960300178008~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:00e72e21a1a33cbdb1271bcee489c14ff79e8a61b39f7d6621fe1815d58991c2
|
| 3 |
+
size 7814760
|
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:206890647fd3431a6d97af1dc10217278c15336813811ff3699c5016a84aaf62
|
| 3 |
+
size 7809300
|
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0e906996a0b44d76dc3a940aba142147b0bcd8809381597afb599fd826cf7862
|
| 3 |
+
size 7806525
|
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3b1c21d922741c93f33138f7ee5b035c0cb301428b84b01a2d789e601890e762
|
| 3 |
+
size 7806295
|
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ad00513840ce1bd270df015654f81d61b9e6cc0f0ac61d69719c199d58eda5aa
|
| 3 |
+
size 7811339
|
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:00b57368c3696972535ec9c23426594704b64b1d8fd4cc78d41ab81e5baf115a
|
| 3 |
+
size 7809062
|
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a3fd050f885df95d5f2c4d52719f96086a570807887dbc9b3aeaf9c3c61f512d
|
| 3 |
+
size 7813137
|
checkpoint_1007000/target.decoder.layers_1.self_attention.key.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:faf30a56a37bea9547fea903c35acd37fb1faf4bfc94107f223426263af88e46
|
| 3 |
+
size 7810348
|
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/.zarray.__tmp10259164110253181884.~1663960300501998~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/.zarray.__tmp107405781971231021.~1663960300886228~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/.zarray.__tmp13096478522792831033.~1663960300545878~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/.zarray.__tmp13463644331749572668.~1663960300420504~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/.zarray.__tmp14299296042507200098.~1663960300500161~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/.zarray.__tmp15565572797164759058.~1663960300348146~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5e701045284592d46167f98d8b0ca3cbd3f175233ee523d820ca46904afd5b19
|
| 3 |
+
size 7836700
|
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:69e2ab91407d61658011a725f64ec7dcfc48d82dd352f2996204ff542db4fc62
|
| 3 |
+
size 7834093
|
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c5a5d15bf97535f622976e8a72b990f982af532e7aeefbabff7a42477a4de962
|
| 3 |
+
size 7833168
|
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:30eabf37c6d5d18d617607835ff265792ee6f80d214ae69e6f4680913195d787
|
| 3 |
+
size 7823762
|
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8dbf14057b42f25618bd415acdeda0cd2dfd7ec60f66151e2990a8c1882ecb3d
|
| 3 |
+
size 7830779
|
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:98d13a3af30513ea35c73a17ffa996ba6d90896db2aaba0e70ce29a377c0bb09
|
| 3 |
+
size 7822361
|
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:689d5ba176f77fe9874bfa38fadfc0cddf8fda136ecb0bb033688ed10d88477c
|
| 3 |
+
size 7823730
|
checkpoint_1007000/target.decoder.layers_11.self_attention.key.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e107e2baecc419ea6992436405df4e7fcb93e04aebf9649b9f423d8a067d5ee7
|
| 3 |
+
size 7821078
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/.zarray.__tmp10677792200381937821.~1663960300730839~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/.zarray.__tmp14644581288504991737.~1663960300502666~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/.zarray.__tmp16166340234170811950.~1663960300862291~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/.zarray.__tmp3136584453132712714.~1663960300495902~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/.zarray.__tmp5626792347056672524.~1663960300468255~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/.zarray.__tmp7840518664900691065.~1663960300384009~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/.zarray.__tmp8455163617466929986.~1663960300548751~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:16ea89428eea453b34c5927542e1dc8f37706e7550b9574c099663d852c88dee
|
| 3 |
+
size 19524269
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:293b6a18356225f94ba2d5e6be0df46db4f89e77627f141cc25657b0d36d5e88
|
| 3 |
+
size 19525021
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d5ddf0ce60e080b478e3be8e47fe61d961e35e530fdb5a3a6918dc111d445d53
|
| 3 |
+
size 19524066
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d20ba31b1805e960aa3b30fa85c8a80d4b8b0e064239e22668bd3baacface5d5
|
| 3 |
+
size 19524850
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a95e8d563e051a396bc98d958ac6fd6ecde95f1ca0de3a0a6cdbe1c60289e62b
|
| 3 |
+
size 19525125
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:30b963abdaec46da0c1e6fce780898b0657f9ebfa8035dd544b69871a31ee02c
|
| 3 |
+
size 19525163
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:209d02007d91a08ecc550142c98fb5ae48f449eddb8f41859ed9e38fb073d0e9
|
| 3 |
+
size 19524548
|
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ed2ffa226e09b55ad16ad4dd656e6791c35f33408d6263a789ddc321e5a55e02
|
| 3 |
+
size 19524489
|
checkpoint_1007000/target.decoder.layers_15.pre_cross_attention_layer_norm.scale/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|