Commit
·
33078ab
1
Parent(s):
dd782e0
Upload part 18
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +68 -0
- checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/.zarray.__tmp10838654574173738215.~1663960300550287~ +1 -0
- checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/.zarray.__tmp11875305851065103450.~1663960300688646~ +1 -0
- checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/.zarray.__tmp12537958174684117772.~1663960300626129~ +1 -0
- checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/.zarray.__tmp1677634420630541774.~1663960300470995~ +1 -0
- checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/.zarray.__tmp17343839063719239799.~1663960300888493~ +1 -0
- checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/.zarray.__tmp3493309919975632425.~1663960300423452~ +1 -0
- checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/.zarray.__tmp6832070039369596802.~1663960300938650~ +1 -0
- checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/.zarray.__tmp2226082934896298061.~1663960300070624~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/.zarray.__tmp6195976044653281671.~1663960300129906~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/.zarray.__tmp13077609528304263398.~1663960300822004~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/.zarray.__tmp15300237782700791169.~1663960300601566~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/.zarray.__tmp17028252708319300563.~1663960300384469~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/.zarray.__tmp18202548913611701275.~1663960300547347~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/.zarray.__tmp18277620472645960770.~1663960300825426~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/.zarray.__tmp2569266975543125332.~1663960300688523~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/.zarray.__tmp3167696657902769257.~1663960300632884~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/.zarray.__tmp10230674669555981316.~1663960300466334~ +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/.zarray.__tmp11987629423212589390.~1663960300941073~ +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/.zarray.__tmp16268122409390166746.~1663960300683293~ +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/.zarray.__tmp16721651795984952837.~1663960300501348~ +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/.zarray.__tmp17936386360462204511.~1663960300729840~ +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/.zarray.__tmp18320135420151810529.~1663960300687044~ +1 -0
- checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/.zarray.__tmp6575118895601473476.~1663960300420632~ +1 -0
.gitattributes
CHANGED
|
@@ -901,3 +901,71 @@ checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.2 filter=lfs diff=
|
|
| 901 |
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 902 |
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 903 |
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 901 |
checkpoint_1007000/target.decoder.layers_12.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 902 |
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 903 |
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 904 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 905 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 906 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 907 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 908 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 909 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 910 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 911 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 912 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 913 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 914 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 915 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 916 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 917 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 918 |
+
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 919 |
+
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 920 |
+
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 921 |
+
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 922 |
+
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 923 |
+
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 924 |
+
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 925 |
+
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 926 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 927 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 928 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 929 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 930 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 931 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 932 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 933 |
+
checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 934 |
+
checkpoint_1007000/target.token_embedder.embedding/15.0 filter=lfs diff=lfs merge=lfs -text
|
| 935 |
+
checkpoint_1007000/target.token_embedder.embedding/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 936 |
+
checkpoint_1007000/target.token_embedder.embedding/9.0 filter=lfs diff=lfs merge=lfs -text
|
| 937 |
+
checkpoint_1007000/target.token_embedder.embedding/21.0 filter=lfs diff=lfs merge=lfs -text
|
| 938 |
+
checkpoint_1007000/target.token_embedder.embedding/12.0 filter=lfs diff=lfs merge=lfs -text
|
| 939 |
+
checkpoint_1007000/target.token_embedder.embedding/61.0 filter=lfs diff=lfs merge=lfs -text
|
| 940 |
+
checkpoint_1007000/target.token_embedder.embedding/22.0 filter=lfs diff=lfs merge=lfs -text
|
| 941 |
+
checkpoint_1007000/target.token_embedder.embedding/28.0 filter=lfs diff=lfs merge=lfs -text
|
| 942 |
+
checkpoint_1007000/target.token_embedder.embedding/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 943 |
+
checkpoint_1007000/target.token_embedder.embedding/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 944 |
+
checkpoint_1007000/target.token_embedder.embedding/31.0 filter=lfs diff=lfs merge=lfs -text
|
| 945 |
+
checkpoint_1007000/target.token_embedder.embedding/14.0 filter=lfs diff=lfs merge=lfs -text
|
| 946 |
+
checkpoint_1007000/target.token_embedder.embedding/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 947 |
+
checkpoint_1007000/target.token_embedder.embedding/37.0 filter=lfs diff=lfs merge=lfs -text
|
| 948 |
+
checkpoint_1007000/target.token_embedder.embedding/59.0 filter=lfs diff=lfs merge=lfs -text
|
| 949 |
+
checkpoint_1007000/target.token_embedder.embedding/27.0 filter=lfs diff=lfs merge=lfs -text
|
| 950 |
+
checkpoint_1007000/target.token_embedder.embedding/56.0 filter=lfs diff=lfs merge=lfs -text
|
| 951 |
+
checkpoint_1007000/target.token_embedder.embedding/40.0 filter=lfs diff=lfs merge=lfs -text
|
| 952 |
+
checkpoint_1007000/target.token_embedder.embedding/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 953 |
+
checkpoint_1007000/target.token_embedder.embedding/24.0 filter=lfs diff=lfs merge=lfs -text
|
| 954 |
+
checkpoint_1007000/target.token_embedder.embedding/60.0 filter=lfs diff=lfs merge=lfs -text
|
| 955 |
+
checkpoint_1007000/target.token_embedder.embedding/43.0 filter=lfs diff=lfs merge=lfs -text
|
| 956 |
+
checkpoint_1007000/target.token_embedder.embedding/47.0 filter=lfs diff=lfs merge=lfs -text
|
| 957 |
+
checkpoint_1007000/target.token_embedder.embedding/32.0 filter=lfs diff=lfs merge=lfs -text
|
| 958 |
+
checkpoint_1007000/target.token_embedder.embedding/33.0 filter=lfs diff=lfs merge=lfs -text
|
| 959 |
+
checkpoint_1007000/target.token_embedder.embedding/35.0 filter=lfs diff=lfs merge=lfs -text
|
| 960 |
+
checkpoint_1007000/target.token_embedder.embedding/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 961 |
+
checkpoint_1007000/target.token_embedder.embedding/8.0 filter=lfs diff=lfs merge=lfs -text
|
| 962 |
+
checkpoint_1007000/target.token_embedder.embedding/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 963 |
+
checkpoint_1007000/target.token_embedder.embedding/38.0 filter=lfs diff=lfs merge=lfs -text
|
| 964 |
+
checkpoint_1007000/target.token_embedder.embedding/54.0 filter=lfs diff=lfs merge=lfs -text
|
| 965 |
+
checkpoint_1007000/target.token_embedder.embedding/20.0 filter=lfs diff=lfs merge=lfs -text
|
| 966 |
+
checkpoint_1007000/target.token_embedder.embedding/50.0 filter=lfs diff=lfs merge=lfs -text
|
| 967 |
+
checkpoint_1007000/target.token_embedder.embedding/30.0 filter=lfs diff=lfs merge=lfs -text
|
| 968 |
+
checkpoint_1007000/target.token_embedder.embedding/29.0 filter=lfs diff=lfs merge=lfs -text
|
| 969 |
+
checkpoint_1007000/target.token_embedder.embedding/11.0 filter=lfs diff=lfs merge=lfs -text
|
| 970 |
+
checkpoint_1007000/target.token_embedder.embedding/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 971 |
+
checkpoint_1007000/target.token_embedder.embedding/58.0 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/.zarray.__tmp10838654574173738215.~1663960300550287~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/.zarray.__tmp11875305851065103450.~1663960300688646~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/.zarray.__tmp12537958174684117772.~1663960300626129~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/.zarray.__tmp1677634420630541774.~1663960300470995~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/.zarray.__tmp17343839063719239799.~1663960300888493~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/.zarray.__tmp3493309919975632425.~1663960300423452~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/.zarray.__tmp6832070039369596802.~1663960300938650~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8474eac0fcbed2fbfb14ebc5a1a5b197c48f11edec67cc9127c7a5ce36444383
|
| 3 |
+
size 19525094
|
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1e84181f8cff3f132a4faeee32cbce5f4748c1bbfc27c4f42cf4b41913ad4699
|
| 3 |
+
size 19524374
|
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:63814fd4055b50dac059dd36f5805ad8898130c78ed99d07081dca620a652169
|
| 3 |
+
size 19524440
|
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:582115fb2f0f596f018756c26090d34f49b93edb486a68d88cc3c7e4448391e3
|
| 3 |
+
size 19525189
|
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8acde6fee0d28d72e2203c4dad3bbc730b91495fc286a17a270e2edcfb8b149e
|
| 3 |
+
size 19524598
|
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0c4216285d75616e6d08137d2ac88b9c0bcc80d191fba380679e350ec2994d34
|
| 3 |
+
size 19523640
|
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f9a80435f6643945eeb4bb5bbf4f1a47dd2c56ff012efec1845d72943f08ff27
|
| 3 |
+
size 19525633
|
checkpoint_1007000/target.decoder.layers_22.mlp.wi_0.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:55fd097fb39638f3bf4146464249492eff589af08b2dc09d2f15e5a84b31d3bc
|
| 3 |
+
size 19525769
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/.zarray.__tmp2226082934896298061.~1663960300070624~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/.zarray.__tmp6195976044653281671.~1663960300129906~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:57db7b29484f45254010a616bfcf543c115e11719ce81487d1ce3ca64813ead5
|
| 3 |
+
size 7809733
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c0caa8ba5d30171353427ba65dae0c355d0cfcf58ae3ed9944b567bbbe1502e9
|
| 3 |
+
size 7813010
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:301c5151f890bf2367219ea1bbcc07d7530a153784091e5fda4c201487a24f0e
|
| 3 |
+
size 7810155
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0753255edb6caca5db013e845f2809085287c88322906acf4f3558b00d5f7a81
|
| 3 |
+
size 7824090
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e821db7d0a7b1d18a3b3966782cb03723c8ee9a5bdc70d43c0f924ec7ca310e0
|
| 3 |
+
size 7814367
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.value.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:91fbfbf0e4edbc6e8a6059699862ec60465a455398c14f28c34b8c5796970e44
|
| 3 |
+
size 7813723
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/.zarray.__tmp13077609528304263398.~1663960300822004~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/.zarray.__tmp15300237782700791169.~1663960300601566~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/.zarray.__tmp17028252708319300563.~1663960300384469~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/.zarray.__tmp18202548913611701275.~1663960300547347~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/.zarray.__tmp18277620472645960770.~1663960300825426~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/.zarray.__tmp2569266975543125332.~1663960300688523~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/.zarray.__tmp3167696657902769257.~1663960300632884~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f3f178cded7ac1e6ad4afb1ef2067e1a7bf099433b1857965aed671c42d271ca
|
| 3 |
+
size 7815537
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:779e9db5131dfa2baa6bea8c5fc2eb2bd8156481484ad082dc27b68a6b4eb80a
|
| 3 |
+
size 7815228
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9e0732a9fcf6839eb0346c3148b604d92e119d0017f63f9c06e63262b9f63d3e
|
| 3 |
+
size 7815959
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0dac80266e959015966a450450117e8a50d35f07fb975286f8e2f394c03e1cb7
|
| 3 |
+
size 7816486
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/4.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7cdb2fee1ee51240fe91ea860658365da5a22ad12d386ae6d959d960ad1a8465
|
| 3 |
+
size 7813637
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/5.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9c342b505d23adf5d349e281ba209fdb3e3471fe572b33c1aa737f99422c937d
|
| 3 |
+
size 7818402
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/6.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:28f71c34dc066d08d14145e391327e228af3a4db730da84312a27c9b33f5d27c
|
| 3 |
+
size 7817166
|
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.out.kernel/7.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f164c30b2e2911921e232947f5739c5d3a19b64fea180bdaddda8321088d151a
|
| 3 |
+
size 7814462
|
checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/.zarray.__tmp10230674669555981316.~1663960300466334~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/.zarray.__tmp11987629423212589390.~1663960300941073~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/.zarray.__tmp16268122409390166746.~1663960300683293~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/.zarray.__tmp16721651795984952837.~1663960300501348~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/.zarray.__tmp17936386360462204511.~1663960300729840~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/.zarray.__tmp18320135420151810529.~1663960300687044~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.self_attention.key.kernel/.zarray.__tmp6575118895601473476.~1663960300420632~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|