Commit ·
f2038ac
1
Parent(s): 778d6b7
Upload part 13
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- .gitattributes +53 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray.__tmp14658094100065076136.~1663960300090561~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray.__tmp16230492432462742032.~1663960300387076~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray.__tmp16379259808268770224.~1663960300175113~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray.__tmp8894115837369550982.~1663960299882008~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray.__tmp8990031795982035122.~1663960299958555~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/.zarray.__tmp11577145964185916981.~1663960300086131~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/.zarray.__tmp9374932084099255530.~1663960300271661~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_3.pre_mlp_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_3.pre_mlp_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/.zarray.__tmp11094273487534505663.~1663960300308880~ +1 -0
- checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/.zarray.__tmp11832826128042483391.~1663960300601290~ +1 -0
- checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.7 +3 -0
- checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray +1 -0
- checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp11545495112761785230.~1663960300421208~ +1 -0
- checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp13140827661821471681.~1663960300546318~ +1 -0
- checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp15222983945689583177.~1663960300941715~ +1 -0
- checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp162813558043179627.~1663960300688213~ +1 -0
- checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp2276807198409161350.~1663960300385594~ +1 -0
- checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp4389650834453463471.~1663960300423047~ +1 -0
- checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp8798756328389882663.~1663960300552107~ +1 -0
- checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.0 +3 -0
- checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.1 +3 -0
- checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.2 +3 -0
- checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.3 +3 -0
- checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.4 +3 -0
- checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.5 +3 -0
- checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.6 +3 -0
- checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.7 +3 -0
- checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/.zarray +1 -0
- checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/.zarray.__tmp13440713807143523604.~1663960300863191~ +1 -0
- checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/.zarray.__tmp14332112127674379251.~1663960300421660~ +1 -0
.gitattributes
CHANGED
|
@@ -650,3 +650,56 @@ checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel
|
|
| 650 |
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 651 |
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 652 |
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 650 |
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 651 |
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 652 |
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 653 |
+
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 654 |
+
checkpoint_1007000/target.encoder.layers_4.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 655 |
+
checkpoint_1007000/target.encoder.layers_4.attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 656 |
+
checkpoint_1007000/target.encoder.layers_4.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 657 |
+
checkpoint_1007000/target.encoder.layers_4.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 658 |
+
checkpoint_1007000/target.encoder.layers_4.attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 659 |
+
checkpoint_1007000/target.encoder.layers_4.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 660 |
+
checkpoint_1007000/target.encoder.layers_4.attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 661 |
+
checkpoint_1007000/target.encoder.layers_4.attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 662 |
+
checkpoint_1007000/target.encoder.layers_22.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 663 |
+
checkpoint_1007000/target.encoder.layers_22.attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 664 |
+
checkpoint_1007000/target.encoder.layers_22.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 665 |
+
checkpoint_1007000/target.encoder.layers_22.attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 666 |
+
checkpoint_1007000/target.encoder.layers_22.attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 667 |
+
checkpoint_1007000/target.encoder.layers_22.attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 668 |
+
checkpoint_1007000/target.encoder.layers_22.attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 669 |
+
checkpoint_1007000/target.encoder.layers_22.attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 670 |
+
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 671 |
+
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 672 |
+
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 673 |
+
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 674 |
+
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 675 |
+
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 676 |
+
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 677 |
+
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 678 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 679 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 680 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 681 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 682 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 683 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 684 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 685 |
+
checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 686 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 687 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 688 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 689 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 690 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 691 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 692 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 693 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 694 |
+
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 695 |
+
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 696 |
+
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 697 |
+
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 698 |
+
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 699 |
+
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 700 |
+
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 701 |
+
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 702 |
+
checkpoint_1007000/target.encoder.layers_23.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 703 |
+
checkpoint_1007000/target.encoder.layers_23.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 704 |
+
checkpoint_1007000/target.encoder.layers_23.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 705 |
+
checkpoint_1007000/target.encoder.layers_23.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray.__tmp14658094100065076136.~1663960300090561~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray.__tmp16230492432462742032.~1663960300387076~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray.__tmp16379259808268770224.~1663960300175113~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray.__tmp8894115837369550982.~1663960299882008~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/.zarray.__tmp8990031795982035122.~1663960299958555~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f6a30f11bdff8e1816aa8440b48708a7446da358fd95ba3d84b3b27bcf99276d
|
| 3 |
+
size 7814640
|
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8c1a110c98bb3427119464208aa12990acd3f8a2b434922707c48bd38d341566
|
| 3 |
+
size 7804931
|
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4ed545265752dcae41736ed90081534d7ad8de9f5fbba2296ef835877d18c480
|
| 3 |
+
size 7800278
|
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dbee059f811bc97efd1ccbbb5d4cffd2a0a4afccb117e6501d32b950b25544ae
|
| 3 |
+
size 7808749
|
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f3a76999e096fddc05ef11a6524d091a644a407fa8e6e8bc87e6507c1c8f7e0b
|
| 3 |
+
size 7816034
|
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:266f15d2c82e2b840700c6af2be4d7452d18af52e40a6191cda70316dc799af8
|
| 3 |
+
size 7807960
|
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c47ac0776e59f0c18898557365714e809deb2b35a0df08c2d1451326e37e9cde
|
| 3 |
+
size 7814802
|
checkpoint_1007000/target.decoder.layers_1.self_attention.value.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ebc325295929c79465a68f4ea2b2fcab693b7ecc8b8b2677e445ace89a42300
|
| 3 |
+
size 7805270
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/.zarray.__tmp11577145964185916981.~1663960300086131~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/.zarray.__tmp9374932084099255530.~1663960300271661~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.encoder_decoder_attention.key.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cfdc5b2eab1c9016cdd8fbc186a5a1bafac804b14ffe84aa7db25a2408b98a5c
|
| 3 |
+
size 7804594
|
checkpoint_1007000/target.decoder.layers_3.pre_mlp_layer_norm.scale/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.pre_mlp_layer_norm.scale/0
ADDED
|
Binary file (15 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/.zarray.__tmp11094273487534505663.~1663960300308880~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/.zarray.__tmp11832826128042483391.~1663960300601290~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9ee6fe1523955408a6d544abb90f458a5c3fa3a42c181cf2e1bf65989eb4f18f
|
| 3 |
+
size 7812419
|
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:498b593babc6ec7160c59ee2a853be0f2289627025a534a120689602c08f027b
|
| 3 |
+
size 7821411
|
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2129698ef8523b5a379085029aeb0a4a7193eb7b24f6fb2afd3f55af5b133dd6
|
| 3 |
+
size 7825787
|
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a647768208da0a3a89ad492f46b29000b1d3fd62c2a73275e64576eec1c9bdb9
|
| 3 |
+
size 7810434
|
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:480ec40a32fa68b8423fc3f033a5b56456eb04805b29b0601cc9dafa143680e0
|
| 3 |
+
size 7822797
|
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e19c2b1cdc06085ba40ea79f0e2b64dd32f6c49707eeb717b88a39123e814b5e
|
| 3 |
+
size 7826665
|
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bb3e300be6926f62c00a7dd5081aedebdaf6d32fa58c3d32d1ed6d4d35fbf19c
|
| 3 |
+
size 7817810
|
checkpoint_1007000/target.decoder.layers_9.self_attention.key.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dc4ba268ceab1c440fc7f1647fa7743326acdc8c56fff6b30af6ed914e15525b
|
| 3 |
+
size 7816754
|
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp11545495112761785230.~1663960300421208~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp13140827661821471681.~1663960300546318~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp15222983945689583177.~1663960300941715~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp162813558043179627.~1663960300688213~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp2276807198409161350.~1663960300385594~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp4389650834453463471.~1663960300423047~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/.zarray.__tmp8798756328389882663.~1663960300552107~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ef0e14ac18af3fd3cea52c137befcb494d7b81d0252a5116d301ec76fe503e9c
|
| 3 |
+
size 7813809
|
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:93505479e928d6d35502b9a871a1982265b51dba82b87a685f1c77f4ba78c364
|
| 3 |
+
size 7815254
|
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:252ca20d245d9180aed6c2a770be65f560be53252cb5e5d3ae2c3cb40bc677be
|
| 3 |
+
size 7813169
|
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bf249000e51b7ef82c68e838dfc86f613445605b2e46bb258b75cbc1d472b103
|
| 3 |
+
size 7815115
|
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:61f47f93552ec62e8aa7ab2b6f6c827f7e90f311f789d309aa8527b6029ea6bf
|
| 3 |
+
size 7814756
|
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1b71bdecd28cacca5c1221e3aa215e70f273947dd4ed7296a10faa8909049ef5
|
| 3 |
+
size 7818533
|
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3e553124a9d99ffc589ccb1358a6eac944930c4d98e5a7d97b4524c1caf4fcf7
|
| 3 |
+
size 7814298
|
checkpoint_1007000/target.encoder.layers_0.attention.query.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d21afbd5babd00fdd95cbf7fc03e030bb962e1bd4b96cd082e3b132f340b97c5
|
| 3 |
+
size 7813354
|
checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/.zarray.__tmp13440713807143523604.~1663960300863191~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_17.mlp.wi_1.kernel/.zarray.__tmp14332112127674379251.~1663960300421660~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|