Commit
·
0ffa27c
1
Parent(s):
eeee4a0
Upload part 41
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +48 -0
- checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/.zarray.__tmp12230286070092369206.~1663960300221050~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/.zarray.__tmp16267921910235602799.~1663960300549410~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/.zarray.__tmp5246829436242909868.~1663960300688232~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/.zarray.__tmp6353388612993010442.~1663960300422197~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/.zarray.__tmp12136563829991507271.~1663960301113503~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/.zarray.__tmp3457622141945448487.~1663960300499676~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/.zarray.__tmp6268435365437568753.~1663960300729856~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/.zarray.__tmp7774465868499159884.~1663960300686147~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/.zarray.__tmp7941873133752388418.~1663960300495124~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/.zarray.__tmp8183231251891778243.~1663960300824537~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/.zarray.__tmp8656452909198619698.~1663960300624128~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.7 +3 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/.zarray +1 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp11166149644689455463.~1663960300312595~ +1 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp15141465125797667691.~1663960300686421~ +1 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp17308594760492408895.~1663960300500855~ +1 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp3977819417319812257.~1663960300554587~ +1 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp5002560965119657100.~1663960300421610~ +1 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp5438925230043786321.~1663960300386435~ +1 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp9071740213102679831.~1663960300730159~ +1 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.0 +3 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.1 +3 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.2 +3 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.3 +3 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.4 +3 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.5 +3 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.6 +3 -0
- checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.7 +3 -0
- checkpoint_1007000/target.encoder.layers_10.pre_attention_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.encoder.layers_10.pre_attention_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.encoder.layers_14.mlp.wi_1.kernel/.zarray +1 -0
- checkpoint_1007000/target.encoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp10302074379200713571.~1663960300425055~ +1 -0
- checkpoint_1007000/target.encoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp11423431248944960156.~1663960301112616~ +1 -0
- checkpoint_1007000/target.encoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp1157397987198533595.~1663960300472110~ +1 -0
- checkpoint_1007000/target.encoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp14430047787721319826.~1663960300887469~ +1 -0
- checkpoint_1007000/target.encoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp16989890204922139169.~1663960300624147~ +1 -0
.gitattributes
CHANGED
|
@@ -2087,3 +2087,51 @@ checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kern
|
|
| 2087 |
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2088 |
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2089 |
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2087 |
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2088 |
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2089 |
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2090 |
+
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2091 |
+
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2092 |
+
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2093 |
+
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2094 |
+
checkpoint_1007000/target.encoder.layers_14.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2095 |
+
checkpoint_1007000/target.encoder.layers_14.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2096 |
+
checkpoint_1007000/target.encoder.layers_14.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2097 |
+
checkpoint_1007000/target.encoder.layers_14.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2098 |
+
checkpoint_1007000/target.encoder.layers_14.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2099 |
+
checkpoint_1007000/target.encoder.layers_14.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2100 |
+
checkpoint_1007000/target.encoder.layers_14.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2101 |
+
checkpoint_1007000/target.encoder.layers_14.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2102 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2103 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2104 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2105 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2106 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2107 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2108 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2109 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2110 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2111 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2112 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2113 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2114 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2115 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2116 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2117 |
+
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2118 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2119 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2120 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2121 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2122 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2123 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2124 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2125 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2126 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2127 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2128 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2129 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2130 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2131 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2132 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2133 |
+
checkpoint_1007000/target.encoder.layers_4.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2134 |
+
checkpoint_1007000/target.encoder.layers_21.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2135 |
+
checkpoint_1007000/target.encoder.layers_21.attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2136 |
+
checkpoint_1007000/target.encoder.layers_21.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2137 |
+
checkpoint_1007000/target.encoder.layers_21.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/.zarray.__tmp12230286070092369206.~1663960300221050~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/.zarray.__tmp16267921910235602799.~1663960300549410~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/.zarray.__tmp5246829436242909868.~1663960300688232~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/.zarray.__tmp6353388612993010442.~1663960300422197~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e6d25e911a98fb3aeb8dd18513dd6b05e46f9509f0b688c57f54812a9c2064ae
|
| 3 |
+
size 7818020
|
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:509ff18402d3974c08b9921f44d2c8d980acf280c8bdcdcf214ff86933ad66af
|
| 3 |
+
size 7817763
|
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:827784a57da000a938011bc280808bff8257335de8d6e9e8acdd058a4f6af9cd
|
| 3 |
+
size 7819675
|
checkpoint_1007000/target.decoder.layers_16.encoder_decoder_attention.query.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:88dadbdc3a8eb995c51e975fc9bdc0ce08e82132b29880af176a1be859b5c6d2
|
| 3 |
+
size 7818141
|
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/.zarray.__tmp12136563829991507271.~1663960301113503~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/.zarray.__tmp3457622141945448487.~1663960300499676~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/.zarray.__tmp6268435365437568753.~1663960300729856~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/.zarray.__tmp7774465868499159884.~1663960300686147~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/.zarray.__tmp7941873133752388418.~1663960300495124~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/.zarray.__tmp8183231251891778243.~1663960300824537~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/.zarray.__tmp8656452909198619698.~1663960300624128~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4d44701569561a2e3629833b8e77a88f2c1af8b23b69f50f25307def5a2ee0fa
|
| 3 |
+
size 7821915
|
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7fb3e69d6e29b5ae4a9d1c230ef8b6724bf001839ea349da3e39df44f6a943db
|
| 3 |
+
size 7831993
|
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bcc036b5d64f6958f64a4693f6f1ab816d249012f4c9803bf772ebcc4c1863be
|
| 3 |
+
size 7827013
|
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cdf9ae9d0b7f13b4ca20113f70f65ea2a0ff64e333474b9e4f37e89975ee731c
|
| 3 |
+
size 7828743
|
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4a9cc0ce39d7d0b4ddb11635520d6bc91bf769465124a7efe887725df2dd4868
|
| 3 |
+
size 7833751
|
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5269e36936270b25bdea999d0312bafbfa8238fe9e3a4567f31153cd7742962f
|
| 3 |
+
size 7827045
|
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e0b3e48524254caa30150db0055b9be2c3991d608ca9d3d52ef2a82b93948b56
|
| 3 |
+
size 7838761
|
checkpoint_1007000/target.decoder.layers_3.self_attention.key.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:169a33f6ad62664ca8065622528c6e39ca3a6e2c20d53f1974f7c9171c153938
|
| 3 |
+
size 7844577
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp11166149644689455463.~1663960300312595~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp15141465125797667691.~1663960300686421~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp17308594760492408895.~1663960300500855~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp3977819417319812257.~1663960300554587~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp5002560965119657100.~1663960300421610~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp5438925230043786321.~1663960300386435~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/.zarray.__tmp9071740213102679831.~1663960300730159~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a0398d120c63624365d5a9ebfe764d220c0c97b02ff98ae181a7d006ddefc445
|
| 3 |
+
size 19494961
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3540e58b05b53a8dc0d974726a6ecf65bf56a9ce6ce5a85e390689f3bba7e6cc
|
| 3 |
+
size 19494764
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f85fad8e77281d23dd8b85b0b4801e9a2d6fd92cf03cb4d089537595ec5f23bc
|
| 3 |
+
size 19494071
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9b50f0e52d6a037f233af71b0a79e654febd26fe8ef1ceda840ca3b81709f5ef
|
| 3 |
+
size 19493838
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2ae38d507341c919bc414bb7b064f317b93229ce86e1e39064647fa541ebe94a
|
| 3 |
+
size 19494556
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:33ae8a8e66417dcb2a0644e70145e6610a1c4e73d2ec7f6c378de60f684cd570
|
| 3 |
+
size 19495259
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e5e923b82f9f9a65dcc35fc7ae3c498cc73c3f7db776cef8fca76b2862bfde8f
|
| 3 |
+
size 19495050
|
checkpoint_1007000/target.encoder.layers_1.mlp.wi_0.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4d24caa8c636afb0ce28dece58f577b9714ae859883b0fde8b8030bae8124fc2
|
| 3 |
+
size 19493988
|
checkpoint_1007000/target.encoder.layers_10.pre_attention_layer_norm.scale/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_10.pre_attention_layer_norm.scale/0
ADDED
|
Binary file (15.2 kB). View file
|
|
|
checkpoint_1007000/target.encoder.layers_14.mlp.wi_1.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp10302074379200713571.~1663960300425055~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp11423431248944960156.~1663960301112616~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp1157397987198533595.~1663960300472110~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp14430047787721319826.~1663960300887469~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp16989890204922139169.~1663960300624147~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|