Commit
·
9285b52
1
Parent(s):
e236c2e
Upload part 6
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +47 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/.zarray.__tmp10135903445638339427.~1663960300221626~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/.zarray.__tmp15507812795183926116.~1663960300134744~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/.zarray.__tmp17065918891033066108.~1663960300134056~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/.zarray.__tmp18363071669361196615.~1663960300547865~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/.zarray.__tmp6797235863693479551.~1663960299959197~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/.zarray.__tmp7409568337816840167.~1663960299927439~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/.zarray.__tmp8028295925901000216.~1663960300229282~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/.zarray.__tmp11320218080532855352.~1663960300727544~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/.zarray.__tmp11702983487948047717.~1663960300176124~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/.zarray.__tmp11862445357819568910.~1663960300423714~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/.zarray.__tmp12414193912703064600.~1663960300386823~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/.zarray.__tmp14430341800417598516.~1663960300550949~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/.zarray.__tmp14750303897168474789.~1663960300822410~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/.zarray.__tmp8147988125675658115.~1663960300471373~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_13.pre_cross_attention_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_13.pre_cross_attention_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/.zarray.__tmp13092359546786096813.~1663960300309759~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/.zarray.__tmp4485941798968990089.~1663960300826958~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/.zarray.__tmp7679950611991273755.~1663960300685678~ +1 -0
- checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/.zarray.__tmp3472968707658101185.~1663960300684343~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/.zarray.__tmp4835589720425785741.~1663960300553600~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/.zarray.__tmp7560343720225524633.~1663960300728619~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/.zarray.__tmp7715507967913497315.~1663960300825238~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/.zarray.__tmp8336891598979106534.~1663960300550514~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/.zarray.__tmp9496274879502398214.~1663960300423477~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/.zarray.__tmp9688532465646657114.~1663960300384325~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/0.2 +3 -0
.gitattributes
CHANGED
|
@@ -322,3 +322,50 @@ checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.6 filter
|
|
| 322 |
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 323 |
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 324 |
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 322 |
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 323 |
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 324 |
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 325 |
+
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 326 |
+
checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 327 |
+
checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 328 |
+
checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 329 |
+
checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 330 |
+
checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 331 |
+
checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 332 |
+
checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 333 |
+
checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 334 |
+
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 335 |
+
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 336 |
+
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 337 |
+
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 338 |
+
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 339 |
+
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 340 |
+
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 341 |
+
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 342 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 343 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 344 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 345 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 346 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 347 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 348 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 349 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 350 |
+
checkpoint_1007000/target.decoder.layers_6.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 351 |
+
checkpoint_1007000/target.decoder.layers_6.self_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 352 |
+
checkpoint_1007000/target.decoder.layers_6.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 353 |
+
checkpoint_1007000/target.decoder.layers_6.self_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 354 |
+
checkpoint_1007000/target.decoder.layers_6.self_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 355 |
+
checkpoint_1007000/target.decoder.layers_6.self_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 356 |
+
checkpoint_1007000/target.decoder.layers_6.self_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 357 |
+
checkpoint_1007000/target.decoder.layers_6.self_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 358 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 359 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 360 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 361 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 362 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 363 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 364 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 365 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 366 |
+
checkpoint_1007000/target.decoder.layers_9.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 367 |
+
checkpoint_1007000/target.decoder.layers_9.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 368 |
+
checkpoint_1007000/target.decoder.layers_9.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 369 |
+
checkpoint_1007000/target.decoder.layers_9.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 370 |
+
checkpoint_1007000/target.decoder.layers_9.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 371 |
+
checkpoint_1007000/target.decoder.layers_9.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/.zarray.__tmp10135903445638339427.~1663960300221626~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/.zarray.__tmp15507812795183926116.~1663960300134744~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/.zarray.__tmp17065918891033066108.~1663960300134056~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/.zarray.__tmp18363071669361196615.~1663960300547865~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/.zarray.__tmp6797235863693479551.~1663960299959197~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/.zarray.__tmp7409568337816840167.~1663960299927439~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/.zarray.__tmp8028295925901000216.~1663960300229282~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9c400b582455f558e6a90ae341689fdfda08954a4f5a1ec5a0d63c95ba4ab1c9
|
| 3 |
+
size 7817009
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d5164a1a65efb42c4aa61758b15532594077062971ae93a1453a6d8b20ad6402
|
| 3 |
+
size 7827137
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8c7b1700e4064ce8df878894fa193e054c82ce00537716029fc0dacc301f29b6
|
| 3 |
+
size 7817891
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f7bccd42d7fd4235de76193df124ff5afcd74b53e09ea0a23a1c1843c311e9e0
|
| 3 |
+
size 7818227
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2d20a7051b8b0569119517fa06d0e0d9f71a9bf3479077bca801f426c2874f4a
|
| 3 |
+
size 7816840
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:559abbe3b521f9c5c52500951a432efefc36a8df1cd02750df057fd4f35a317a
|
| 3 |
+
size 7817296
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8a39ccb548d7e2735a7775c69e2e2650f19f789e9a3e3daea956e31e362f543c
|
| 3 |
+
size 7816975
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.value.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0fc21154b380da00f80611ca388dade4183f0d38ca4541e7c2efe4427ff4d1b3
|
| 3 |
+
size 7816995
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/.zarray.__tmp11320218080532855352.~1663960300727544~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/.zarray.__tmp11702983487948047717.~1663960300176124~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/.zarray.__tmp11862445357819568910.~1663960300423714~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/.zarray.__tmp12414193912703064600.~1663960300386823~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/.zarray.__tmp14430341800417598516.~1663960300550949~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/.zarray.__tmp14750303897168474789.~1663960300822410~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/.zarray.__tmp8147988125675658115.~1663960300471373~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe615caebca160ff4eab5969b5394898f2a73c391dcfa844ad3cf52e207853e5
|
| 3 |
+
size 7821266
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4ad3faf292360f18369eb135bc755799b23dccbfebd87fedb5524f6565168dae
|
| 3 |
+
size 7819359
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5ae73d2b6607250cd29ede50fd230ac494b07a552c1c970ca2839170b247fcec
|
| 3 |
+
size 7819404
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6a788087ea3c579e24718e819d691b0fa2ccbce7077d13169f41cfe8e3b1e955
|
| 3 |
+
size 7819468
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/4.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6579151391f78e90ddc847a1b27e1615f17e287e6de92ed408d349914967b5ed
|
| 3 |
+
size 7819734
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/5.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:15dbaf17c977f48efa423c28ae5db154c362293790006fc12142dd0a7b4dff4a
|
| 3 |
+
size 7820257
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/6.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a7af062448337b70b9921d565d76fb0f0f60a799e2a564d93b5e8148474374a4
|
| 3 |
+
size 7818976
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.out.kernel/7.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:df63fe586819acc3d7c3002727b89920a7f2d3995edfb5f06837ba62d6fde79e
|
| 3 |
+
size 7819116
|
checkpoint_1007000/target.decoder.layers_13.pre_cross_attention_layer_norm.scale/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.pre_cross_attention_layer_norm.scale/0
ADDED
|
Binary file (14.8 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/.zarray.__tmp13092359546786096813.~1663960300309759~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/.zarray.__tmp4485941798968990089.~1663960300826958~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/.zarray.__tmp7679950611991273755.~1663960300685678~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_21.self_attention.key.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:53d8ce0c079b84ed5782ce34340294896e37498ac58f2b41af66048060ec6dd4
|
| 3 |
+
size 7807892
|
checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/.zarray.__tmp3472968707658101185.~1663960300684343~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/.zarray.__tmp4835589720425785741.~1663960300553600~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/.zarray.__tmp7560343720225524633.~1663960300728619~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/.zarray.__tmp7715507967913497315.~1663960300825238~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/.zarray.__tmp8336891598979106534.~1663960300550514~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/.zarray.__tmp9496274879502398214.~1663960300423477~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/.zarray.__tmp9688532465646657114.~1663960300384325~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6614e2177b3c4147425e3ddf17969cc2f4e48250b61174ee06cce5d9dd8ff140
|
| 3 |
+
size 7809229
|
checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4ff5a6d3b44c5325e41f7b363d22c41be4c940cd592908938cb556c9f37f9cb5
|
| 3 |
+
size 7807827
|
checkpoint_1007000/target.decoder.layers_23.self_attention.key.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d94fb08d28dbe9e7ea57349af4248e510c76f0eaf1b1d31c4528c8f6d9f9c1b3
|
| 3 |
+
size 7807918
|