Commit
·
80d4197
1
Parent(s):
e4b46a6
Upload part 55
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +54 -0
- checkpoint_1007000/state.param_states.encoder.layers_9.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_9.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp1105937564183758640.~1663960300385287~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp15260046325040061733.~1663960300015249~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp16338011193803630159.~1663960299960414~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp17973336360947397177.~1663960300229539~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp4456958716237740877.~1663960300269062~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp6550413818954659962.~1663960300089897~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp10566777187724039402.~1663960300502375~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp1347708317805751784.~1663960300822526~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp13560500597481309211.~1663960300548101~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp3254274290136234671.~1663960300826412~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp3740934665043393579.~1663960300938689~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp4268711832544831810.~1663960300729669~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp9074334274789578976.~1663960300622114~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/.zarray.__tmp17012158359598794522.~1663960300132054~ +1 -0
- checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/.zarray.__tmp13528873057967423628.~1663960300500187~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/.zarray.__tmp1499336269700896617.~1663960300729091~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/.zarray.__tmp17842300620868211239.~1663960300424968~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/3.0 +3 -0
.gitattributes
CHANGED
|
@@ -2773,3 +2773,57 @@ checkpoint_1007000/target.encoder.layers_13.mlp.wi_0.kernel/0.2 filter=lfs diff=
|
|
| 2773 |
checkpoint_1007000/target.encoder.layers_13.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2774 |
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 2775 |
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2773 |
checkpoint_1007000/target.encoder.layers_13.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2774 |
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 2775 |
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 2776 |
+
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 2777 |
+
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2778 |
+
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 2779 |
+
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 2780 |
+
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 2781 |
+
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 2782 |
+
checkpoint_1007000/target.encoder.layers_8.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 2783 |
+
checkpoint_1007000/target.encoder.layers_8.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 2784 |
+
checkpoint_1007000/target.encoder.layers_8.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 2785 |
+
checkpoint_1007000/target.encoder.layers_8.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2786 |
+
checkpoint_1007000/target.encoder.layers_8.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 2787 |
+
checkpoint_1007000/target.encoder.layers_8.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 2788 |
+
checkpoint_1007000/target.encoder.layers_8.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 2789 |
+
checkpoint_1007000/target.encoder.layers_8.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 2790 |
+
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 2791 |
+
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 2792 |
+
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 2793 |
+
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2794 |
+
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 2795 |
+
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 2796 |
+
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 2797 |
+
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 2798 |
+
checkpoint_1007000/target.encoder.layers_6.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2799 |
+
checkpoint_1007000/target.encoder.layers_6.attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2800 |
+
checkpoint_1007000/target.encoder.layers_6.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2801 |
+
checkpoint_1007000/target.encoder.layers_6.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2802 |
+
checkpoint_1007000/target.encoder.layers_6.attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2803 |
+
checkpoint_1007000/target.encoder.layers_6.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2804 |
+
checkpoint_1007000/target.encoder.layers_6.attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2805 |
+
checkpoint_1007000/target.encoder.layers_6.attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2806 |
+
checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 2807 |
+
checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 2808 |
+
checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 2809 |
+
checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2810 |
+
checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 2811 |
+
checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 2812 |
+
checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 2813 |
+
checkpoint_1007000/target.decoder.layers_4.encoder_decoder_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 2814 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 2815 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 2816 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 2817 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2818 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 2819 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 2820 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 2821 |
+
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 2822 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 2823 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 2824 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 2825 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2826 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 2827 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 2828 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 2829 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.encoder.layers_9.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_9.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (15.3 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp1105937564183758640.~1663960300385287~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp15260046325040061733.~1663960300015249~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp16338011193803630159.~1663960299960414~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp17973336360947397177.~1663960300229539~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp4456958716237740877.~1663960300269062~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/.zarray.__tmp6550413818954659962.~1663960300089897~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:14d66b8a9a7fd4f9fca0e71aa936ed0d599101321b99c1015b85ea5eb9fcad98
|
| 3 |
+
size 7815329
|
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:859f60411b6d2a62bba21fc946b24481b11a49538f563ea9ebd6e9bbef8e3c4b
|
| 3 |
+
size 7814419
|
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:39d87eaf5730070828b8810551ac99870d193d974bb0c1f63eafea82417b5e75
|
| 3 |
+
size 7814004
|
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6c5ecf8051338723fd2e506791022c8ce49d75051daaaf5575601aedaf18e59a
|
| 3 |
+
size 7814979
|
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/4.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aaeb62ffe69e8e3dc6d8004d75418abb2d1f9bb635b89c66daace3fff4564f46
|
| 3 |
+
size 7815022
|
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/5.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:358210a1c8fbafbea4046fee6a4cb63707c0d2c97ff24708bbf5562fd734c855
|
| 3 |
+
size 7812398
|
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/6.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0038f285a990bf58bcf449aa175e5f3dc0d02824ad8582236077f560c6c55f40
|
| 3 |
+
size 7813357
|
checkpoint_1007000/target.decoder.layers_10.self_attention.out.kernel/7.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0031c644d7704833825c511a130eace4092be56785872cb86bf13175a714b938
|
| 3 |
+
size 7811733
|
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp10566777187724039402.~1663960300502375~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp1347708317805751784.~1663960300822526~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp13560500597481309211.~1663960300548101~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp3254274290136234671.~1663960300826412~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp3740934665043393579.~1663960300938689~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp4268711832544831810.~1663960300729669~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/.zarray.__tmp9074334274789578976.~1663960300622114~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dad001c678352e4c543805f0c7c89996fc9335d8049ca42144477988bb944301
|
| 3 |
+
size 19547411
|
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:af2c9811711cc482bbfaa4bea1b79aee6ecce6a9aac00d97229547c421102c86
|
| 3 |
+
size 19547290
|
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:56df1744db0f6b3be75e5c70d388e0f37b43c9afde58038b29ff04e5a627f5a6
|
| 3 |
+
size 19547356
|
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:37abfe7f832307d1cd3b4e9ed215928b25621fbee2fb31ccfde54e1174ac2a12
|
| 3 |
+
size 19546715
|
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/4.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:976d917a3b4857c36e3686b8b38bcfda604a7d1ae0a074ec0159487f80140450
|
| 3 |
+
size 19547102
|
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/5.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4ca0a34a83edb4b4b0bcc4f63ee9177fc09b7b09ddc74c690a494bb9ee412745
|
| 3 |
+
size 19547223
|
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/6.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4569daf609e906701708f00b4325ed5f0438a367beffbcc748f585dd5048d204
|
| 3 |
+
size 19546611
|
checkpoint_1007000/target.decoder.layers_12.mlp.wo.kernel/7.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5f017dfaf0f98ed36896c81ace50bb55de7164a6e2545bd6558360cc20930c19
|
| 3 |
+
size 19547073
|
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/.zarray.__tmp17012158359598794522.~1663960300132054~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:79d5b97e5dffddf344aa1a4c4aba71b5b45462f682d8b9a3ad25bcb55e9ad0fd
|
| 3 |
+
size 7804234
|
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e2a2690dec9b402469073c23bb92f0afe2cabf45bed4e5121a2c2329767736fd
|
| 3 |
+
size 7805172
|
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d05188293e8d66ccd355ac0cebce9dd73c2a1c781cd5f8ebad98d7f0d21143ab
|
| 3 |
+
size 7804864
|
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/4.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2fbaa2868fd28a1fbb535827a4e53826da1f3a7db432389e4d6b9dc54513f676
|
| 3 |
+
size 7803327
|
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/5.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8a3c69875e40a669ab8daae0f4af5af1720619f6612496ebec9617f4ce480b2f
|
| 3 |
+
size 7805047
|
checkpoint_1007000/target.decoder.layers_19.self_attention.out.kernel/7.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6e29169c980821ecdf9fc25ce4f1d04ea34a3173c5dbbb88878ba34e63422295
|
| 3 |
+
size 7803180
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/.zarray.__tmp13528873057967423628.~1663960300500187~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/.zarray.__tmp1499336269700896617.~1663960300729091~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/.zarray.__tmp17842300620868211239.~1663960300424968~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9eb87bf15d477db621dc2176ce414fa22fc1f00ba7de640d8d4e50b2adf65141
|
| 3 |
+
size 7810379
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e9b0ed2565a589d24d3bedd1ad7a740c4cfed5cefa758e5ac8d2a0d81e90e970
|
| 3 |
+
size 7808995
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2c4d56de663b52dff8cf1fb27b9e1bf7aed9661e52a1435ebde4f7cf373f78f0
|
| 3 |
+
size 7809281
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.out.kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23ca5c0402acd6ab7c1efb59f6df9ff276b39e00803aa6778c0bba30ec514b42
|
| 3 |
+
size 7808493
|