Commit
·
e42c1df
1
Parent(s):
651860e
Upload part 44
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +50 -0
- checkpoint_1007000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.decoder.layers_21.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_21.pre_cross_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.encoder.layers_12.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_12.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/.zarray.__tmp13317862693414254449.~1663960300266463~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/.zarray.__tmp18351130551550344796.~1663960300986535~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/.zarray.__tmp282961741546003797.~1663960300014359~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/.zarray.__tmp3981875622317747831.~1663960300134002~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/.zarray.__tmp9770001286954173129.~1663960300268068~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/.zarray.__tmp14755775162671015479.~1663960300313196~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/.zarray.__tmp15929711136369962275.~1663960300466126~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/.zarray.__tmp3211724514550199944.~1663960300686406~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/.zarray.__tmp5542698970820471895.~1663960300504670~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/.zarray.__tmp5757567167324112445.~1663960300775434~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/.zarray.__tmp9536086688303990048.~1663960300420628~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/.zarray.__tmp9613167283394802845.~1663960300622402~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.7 +3 -0
- checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/.zarray +1 -0
- checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/.zarray.__tmp13557785600670434127.~1663960300070675~ +1 -0
- checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/.zarray.__tmp3142583028134086573.~1663960300087867~ +1 -0
- checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.0 +3 -0
- checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.1 +3 -0
- checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.2 +3 -0
- checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.3 +3 -0
- checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.4 +3 -0
- checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.5 +3 -0
- checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.6 +3 -0
- checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.7 +3 -0
- checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/.zarray +1 -0
- checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/.zarray.__tmp14933477324427723908.~1663960300554232~ +1 -0
.gitattributes
CHANGED
|
@@ -2237,3 +2237,53 @@ checkpoint_1007000/target.encoder.layers_4.attention.value.kernel/0.2 filter=lfs
|
|
| 2237 |
checkpoint_1007000/target.encoder.layers_4.attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2238 |
checkpoint_1007000/target.encoder.layers_22.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2239 |
checkpoint_1007000/target.encoder.layers_22.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2237 |
checkpoint_1007000/target.encoder.layers_4.attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2238 |
checkpoint_1007000/target.encoder.layers_22.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2239 |
checkpoint_1007000/target.encoder.layers_22.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2240 |
+
checkpoint_1007000/target.encoder.layers_22.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2241 |
+
checkpoint_1007000/target.encoder.layers_22.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2242 |
+
checkpoint_1007000/target.encoder.layers_22.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2243 |
+
checkpoint_1007000/target.encoder.layers_22.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2244 |
+
checkpoint_1007000/target.encoder.layers_22.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2245 |
+
checkpoint_1007000/target.encoder.layers_22.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2246 |
+
checkpoint_1007000/target.encoder.layers_8.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2247 |
+
checkpoint_1007000/target.encoder.layers_8.attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2248 |
+
checkpoint_1007000/target.encoder.layers_8.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2249 |
+
checkpoint_1007000/target.encoder.layers_8.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2250 |
+
checkpoint_1007000/target.encoder.layers_8.attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2251 |
+
checkpoint_1007000/target.encoder.layers_8.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2252 |
+
checkpoint_1007000/target.encoder.layers_8.attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2253 |
+
checkpoint_1007000/target.encoder.layers_8.attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2254 |
+
checkpoint_1007000/target.encoder.layers_9.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2255 |
+
checkpoint_1007000/target.encoder.layers_9.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2256 |
+
checkpoint_1007000/target.encoder.layers_9.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2257 |
+
checkpoint_1007000/target.encoder.layers_9.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2258 |
+
checkpoint_1007000/target.encoder.layers_9.attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2259 |
+
checkpoint_1007000/target.encoder.layers_9.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2260 |
+
checkpoint_1007000/target.encoder.layers_9.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2261 |
+
checkpoint_1007000/target.encoder.layers_9.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2262 |
+
checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2263 |
+
checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2264 |
+
checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2265 |
+
checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2266 |
+
checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2267 |
+
checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2268 |
+
checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2269 |
+
checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2270 |
+
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 2271 |
+
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 2272 |
+
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 2273 |
+
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2274 |
+
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 2275 |
+
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 2276 |
+
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 2277 |
+
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 2278 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2279 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2280 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2281 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2282 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2283 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2284 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2285 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2286 |
+
checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2287 |
+
checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2288 |
+
checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2289 |
+
checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0
ADDED
|
Binary file (14.9 kB). View file
|
|
|
checkpoint_1007000/state.param_states.decoder.layers_21.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_21.pre_cross_attention_layer_norm.scale.v/0
ADDED
|
Binary file (14.4 kB). View file
|
|
|
checkpoint_1007000/state.param_states.encoder.layers_12.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_12.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (15.3 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/.zarray.__tmp13317862693414254449.~1663960300266463~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/.zarray.__tmp18351130551550344796.~1663960300986535~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/.zarray.__tmp282961741546003797.~1663960300014359~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/.zarray.__tmp3981875622317747831.~1663960300134002~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/.zarray.__tmp9770001286954173129.~1663960300268068~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7960fb893fe2dac92b7fa93a0bb80569a87a012d3951145a9f778fe34cf4ee2d
|
| 3 |
+
size 7817722
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:824b26e4bccfc6a5e1ebc0e3cacaf8695057509a6fff8d2214ba70ac11d3e7c5
|
| 3 |
+
size 7817686
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4634c7a1e6a40b31ccbe1ef9485a2330341d6956098240b4871f3b11c5119779
|
| 3 |
+
size 7818607
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bf8b8656b9b62fc00f8c0c3732fcef73b33d1ec34f11c72be713ce4c438a201a
|
| 3 |
+
size 7819206
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/4.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c491e23dd2865b7a66b7e06b8c046c66ac3c5edcbb8cc784090b3f4f2eb635cb
|
| 3 |
+
size 7817334
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/5.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:47ccce5b4f0a7fbfa2c6d6a847cff8a3df46d89110154ea38ccc428e9b6f05be
|
| 3 |
+
size 7817902
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/6.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:805e10892b9a692b20413f4f1dc3d854d255547037c99253dc2781367403a4e1
|
| 3 |
+
size 7818753
|
checkpoint_1007000/target.decoder.layers_11.encoder_decoder_attention.out.kernel/7.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eea6a1e47981f1f2afee929609ae82d10f0b5f743c6759b9a125d6c9e4656ea0
|
| 3 |
+
size 7817893
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/.zarray.__tmp14755775162671015479.~1663960300313196~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/.zarray.__tmp15929711136369962275.~1663960300466126~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/.zarray.__tmp3211724514550199944.~1663960300686406~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/.zarray.__tmp5542698970820471895.~1663960300504670~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/.zarray.__tmp5757567167324112445.~1663960300775434~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/.zarray.__tmp9536086688303990048.~1663960300420628~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/.zarray.__tmp9613167283394802845.~1663960300622402~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:12ce1381cf2febf93d6a7ec9bbb6be4b0c6a9877c55515f20fa48d3b47de5312
|
| 3 |
+
size 7803437
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a4ceb3a689397ed013780b08c7e82f4883eb5709491d111a5f07087c0db4faf1
|
| 3 |
+
size 7804047
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d58c3ef1bba3427b79468a212b805f67ff973ae7396fd09002a22af391db0ad8
|
| 3 |
+
size 7809740
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:627d2237fd256e19ad540b450568ea5b17d3e0a81f41ec8c0f5073688f55d04d
|
| 3 |
+
size 7803345
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9915e5c6769013b943753c4a23e3e57abb129bf485bbf7befc79852453b0d03e
|
| 3 |
+
size 7807705
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f7d7ac10eae42c145a13ca94d6dfdfc81e1a65defaa39396076b6756413cfc21
|
| 3 |
+
size 7807067
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0d9c4f6bb9ebdb65388a93610d2382fb2bb8248defc2891f4b1c733176124775
|
| 3 |
+
size 7806649
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.key.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:206703a0a9d6b238ae3bb06fdf454d211f4e884102ea276c0b767c96d5b34090
|
| 3 |
+
size 7809570
|
checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/.zarray.__tmp13557785600670434127.~1663960300070675~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/.zarray.__tmp3142583028134086573.~1663960300087867~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:01cdf0f52ebef390dc39091c67ecdb37c98b22bb857984b348e799930a8e4f43
|
| 3 |
+
size 7807700
|
checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7da550d68a3c851242c291656346254965590577ae5b415ef0c111fa2b82833d
|
| 3 |
+
size 7805692
|
checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a337032e72b0d809f9086488a864528e75cce7047dcf905a457ab00aa9287cb7
|
| 3 |
+
size 7804683
|
checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a2b8d64803d550be3a79f46ce1004a7d585a63453cd3723cf39f33748ac99c72
|
| 3 |
+
size 7803862
|
checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e89405738cc9fb550a4e026dcd02371fba2e193bf82b7c80510bcd2bb0565576
|
| 3 |
+
size 7804358
|
checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5ced267946938aa9c1c23c83afbdc583da75e71a00ac4b18be10ae790ad0d326
|
| 3 |
+
size 7806170
|
checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86b4dcfa0b03c0e2fd3bf9f8d831804b07775835dab08a0b98be808ac4c80cd6
|
| 3 |
+
size 7808337
|
checkpoint_1007000/target.encoder.layers_12.attention.value.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7cbb6d12a558b827cf7f37aafb3ed797b43bcd394b31c0dbcbbd58f6de8dae43
|
| 3 |
+
size 7807169
|
checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/.zarray.__tmp14933477324427723908.~1663960300554232~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|