Commit
·
b4094ee
1
Parent(s):
53c8883
Upload part 57
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +47 -0
- checkpoint_1007000/state.param_states.decoder.layers_16.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_16.pre_self_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.decoder.layers_17.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_17.pre_cross_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp11967534918600256712.~1663960300731352~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp12116594510275191610.~1663960300777514~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp12304348451064847213.~1663960300986530~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp13310934941979263747.~1663960300683726~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp18385801330057887807.~1663960300864813~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp634374725557603528.~1663960300547126~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp9485643803848471270.~1663960300384027~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/.zarray.__tmp11447578929309787520.~1663960300385907~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/.zarray.__tmp13648125117664041438.~1663960300940885~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/.zarray.__tmp15507758539978721047.~1663960300686139~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/.zarray.__tmp15512045140657548902.~1663960300622653~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/.zarray.__tmp16501937074643373459.~1663960300601852~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/.zarray.__tmp16947834950297711014.~1663960300547786~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/.zarray.__tmp18289644900162670642.~1663960300609209~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_16.self_attention.value.kernel/.zarray.__tmp13801572173648255722.~1663960300887609~ +1 -0
- checkpoint_1007000/target.decoder.layers_16.self_attention.value.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_16.self_attention.value.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_16.self_attention.value.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/.zarray.__tmp10837781989906440906.~1663960300776894~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/.zarray.__tmp13511791436579086504.~1663960300313098~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/.zarray.__tmp16657987775539201437.~1663960300466125~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/.zarray.__tmp16893554706971755259.~1663960300602777~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/.zarray.__tmp2472678329142631110.~1663960300551443~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/.zarray.__tmp3527000890062476291.~1663960300465947~ +1 -0
.gitattributes
CHANGED
|
@@ -2872,3 +2872,50 @@ checkpoint_1007000/target.decoder.layers_16.self_attention.value.kernel/0.7 filt
|
|
| 2872 |
checkpoint_1007000/target.decoder.layers_16.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2873 |
checkpoint_1007000/target.decoder.layers_16.self_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2874 |
checkpoint_1007000/target.decoder.layers_16.self_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2872 |
checkpoint_1007000/target.decoder.layers_16.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2873 |
checkpoint_1007000/target.decoder.layers_16.self_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2874 |
checkpoint_1007000/target.decoder.layers_16.self_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2875 |
+
checkpoint_1007000/target.decoder.layers_16.self_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2876 |
+
checkpoint_1007000/target.decoder.layers_16.self_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2877 |
+
checkpoint_1007000/target.decoder.layers_16.self_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2878 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2879 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2880 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2881 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2882 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2883 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2884 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2885 |
+
checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2886 |
+
checkpoint_1007000/target.decoder.layers_4.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 2887 |
+
checkpoint_1007000/target.decoder.layers_4.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 2888 |
+
checkpoint_1007000/target.decoder.layers_4.self_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 2889 |
+
checkpoint_1007000/target.decoder.layers_4.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2890 |
+
checkpoint_1007000/target.decoder.layers_4.self_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 2891 |
+
checkpoint_1007000/target.decoder.layers_4.self_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 2892 |
+
checkpoint_1007000/target.decoder.layers_4.self_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 2893 |
+
checkpoint_1007000/target.decoder.layers_4.self_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 2894 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2895 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2896 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2897 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2898 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2899 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2900 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2901 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2902 |
+
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2903 |
+
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2904 |
+
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2905 |
+
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2906 |
+
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2907 |
+
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2908 |
+
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2909 |
+
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2910 |
+
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2911 |
+
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2912 |
+
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2913 |
+
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 2914 |
+
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 2915 |
+
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 2916 |
+
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 2917 |
+
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 2918 |
+
checkpoint_1007000/target.encoder.layers_15.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 2919 |
+
checkpoint_1007000/target.encoder.layers_15.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 2920 |
+
checkpoint_1007000/target.encoder.layers_15.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 2921 |
+
checkpoint_1007000/target.encoder.layers_15.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_16.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_16.pre_self_attention_layer_norm.scale.v/0
ADDED
|
Binary file (15 kB). View file
|
|
|
checkpoint_1007000/state.param_states.decoder.layers_17.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_17.pre_cross_attention_layer_norm.scale.v/0
ADDED
|
Binary file (14.8 kB). View file
|
|
|
checkpoint_1007000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (15.3 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp11967534918600256712.~1663960300731352~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp12116594510275191610.~1663960300777514~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp12304348451064847213.~1663960300986530~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp13310934941979263747.~1663960300683726~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp18385801330057887807.~1663960300864813~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp634374725557603528.~1663960300547126~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/.zarray.__tmp9485643803848471270.~1663960300384027~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b3d836b39ed578f7edf0b9fe98d83068fea71f75b81ce4cca771d54aadee5ccc
|
| 3 |
+
size 19506452
|
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7fa033ea2c57b273ccf5468d7ef1f09cfe478f36ac7d4330bf6fcf3f25de112e
|
| 3 |
+
size 19507236
|
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e9a0421906602246ef579d01ebeb1c0fb8f038d9ca08001c4e1e29f7380f8b7b
|
| 3 |
+
size 19507664
|
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c2e99f08f08255f7a1f648a572cd3d2e8d08c11758e477781603cbde5bd79a13
|
| 3 |
+
size 19507627
|
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d474d5df59f5a036a7cc188834ddb8d9accb4cee1cf23ff558559ace2bbfcd22
|
| 3 |
+
size 19507420
|
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a408400aa3f727f0f468e4dc37dd065ce6744c83d46593815c08e63de308ccea
|
| 3 |
+
size 19506540
|
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:40d031f5db4527d0a8fc393b2c49a069225ede0d60125ed016113f0a3ef5479a
|
| 3 |
+
size 19506735
|
checkpoint_1007000/target.decoder.layers_14.mlp.wi_1.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:29272554970915356cbd4d0b798c66a36fc56d9d86ec32b75a8caeeada3460c7
|
| 3 |
+
size 19507857
|
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/.zarray.__tmp11447578929309787520.~1663960300385907~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/.zarray.__tmp13648125117664041438.~1663960300940885~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/.zarray.__tmp15507758539978721047.~1663960300686139~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/.zarray.__tmp15512045140657548902.~1663960300622653~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/.zarray.__tmp16501937074643373459.~1663960300601852~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/.zarray.__tmp16947834950297711014.~1663960300547786~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/.zarray.__tmp18289644900162670642.~1663960300609209~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:33aea22975e6a72c19cb86234f65d6b8a14555971d1a9e98057d0c51b71cf16c
|
| 3 |
+
size 7818941
|
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8d8ff7a71bc6f7c403fd95dc5a1049edaf68f701c378ef5bbfb361872b784cff
|
| 3 |
+
size 7823316
|
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d25802d4b0667db41d1212d2b33dd74963fa32f15621b278a8e225f57dbf446d
|
| 3 |
+
size 7824612
|
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:752cddbb3cf0d8ca5d3bfdad778dc3a75a0980dd9aa3615ec567366afb79b135
|
| 3 |
+
size 7818837
|
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7e73666d08f6f40e2d00401f255064036a4da12fcfc23ad8ac424352431644fb
|
| 3 |
+
size 7821153
|
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:71ffa65f6057cbadab4693fef141cfc9da79a896bf1540d82175f805cbe2ac94
|
| 3 |
+
size 7821016
|
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c528010e7cd06f04a1a758a39071f2e9437dc395ae1110bd66f056570774f6a5
|
| 3 |
+
size 7837019
|
checkpoint_1007000/target.decoder.layers_16.self_attention.key.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d832fbded153b754ae43e1f7f2f4d70b96c5f889cbb30791a4d3d2b39cef57a8
|
| 3 |
+
size 7825264
|
checkpoint_1007000/target.decoder.layers_16.self_attention.value.kernel/.zarray.__tmp13801572173648255722.~1663960300887609~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_16.self_attention.value.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e3b70f03d049ccc5b2fb1e2db1494001879d408349f136a835449430720d69fb
|
| 3 |
+
size 7860277
|
checkpoint_1007000/target.decoder.layers_16.self_attention.value.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:94274ccd666812d056b60842f8e0415017e51c49168cf24f3d81952a7be9f995
|
| 3 |
+
size 7809516
|
checkpoint_1007000/target.decoder.layers_16.self_attention.value.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a75a4c64f6f2540bb53db5da25a189428e9b0b9c40bd84b34b060f831b84f84d
|
| 3 |
+
size 7823651
|
checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/.zarray.__tmp10837781989906440906.~1663960300776894~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/.zarray.__tmp13511791436579086504.~1663960300313098~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/.zarray.__tmp16657987775539201437.~1663960300466125~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/.zarray.__tmp16893554706971755259.~1663960300602777~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/.zarray.__tmp2472678329142631110.~1663960300551443~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.self_attention.value.kernel/.zarray.__tmp3527000890062476291.~1663960300465947~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|