Commit ·
5327049
1
Parent(s): f89a69d
Upload part 20
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +50 -0
- checkpoint_1007000/state.param_states.encoder.layers_6.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_6.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/.zarray.__tmp14948618746349344249.~1663960300347124~ +1 -0
- checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/.zarray.__tmp15136683855597450498.~1663960300602933~ +1 -0
- checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/.zarray.__tmp16296990592820050215.~1663960300308916~ +1 -0
- checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/.zarray.__tmp1795439801511837984.~1663960300622622~ +1 -0
- checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/.zarray.__tmp2934560606035510395.~1663960300499931~ +1 -0
- checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/.zarray.__tmp5027861047478533928.~1663960300873901~ +1 -0
- checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/.zarray.__tmp9983986926069909442.~1663960300495889~ +1 -0
- checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/.zarray.__tmp11247101534926358783.~1663960301029518~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/.zarray.__tmp11530036502559773605.~1663960300599558~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/.zarray.__tmp11533343011294122965.~1663960300685620~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/.zarray.__tmp14471913516189679261.~1663960300548514~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/.zarray.__tmp3767049663912894977.~1663960300826421~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/.zarray.__tmp9965923146098643733.~1663960300822693~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/.zarray.__tmp13791303887804226964.~1663960300222694~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/.zarray.__tmp2424312097602939268.~1663960300500258~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/.zarray.__tmp4016091107658042345.~1663960300308445~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/.zarray.__tmp6740747515324763376.~1663960300502174~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/.zarray.__tmp9565010299137988556.~1663960300384292~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/.zarray.__tmp9946291196097989741.~1663960300131874~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.query.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.query.kernel/.zarray.__tmp10437380399954342908.~1663960300632967~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.query.kernel/.zarray.__tmp12479088181979160916.~1663960300685235~ +1 -0
.gitattributes
CHANGED
|
@@ -1029,3 +1029,53 @@ checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.key.kernel/
|
|
| 1029 |
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1030 |
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1031 |
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1029 |
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1030 |
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1031 |
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 1032 |
+
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1033 |
+
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 1034 |
+
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 1035 |
+
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 1036 |
+
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 1037 |
+
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1038 |
+
checkpoint_1007000/target.encoder.layers_0.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1039 |
+
checkpoint_1007000/target.encoder.layers_0.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 1040 |
+
checkpoint_1007000/target.encoder.layers_0.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1041 |
+
checkpoint_1007000/target.encoder.layers_0.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 1042 |
+
checkpoint_1007000/target.encoder.layers_0.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 1043 |
+
checkpoint_1007000/target.encoder.layers_0.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 1044 |
+
checkpoint_1007000/target.encoder.layers_0.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 1045 |
+
checkpoint_1007000/target.encoder.layers_0.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1046 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1047 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 1048 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1049 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 1050 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 1051 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 1052 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 1053 |
+
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1054 |
+
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
| 1055 |
+
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 1056 |
+
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 1057 |
+
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1058 |
+
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
| 1059 |
+
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
| 1060 |
+
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 1061 |
+
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
| 1062 |
+
checkpoint_1007000/target.encoder.layers_3.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1063 |
+
checkpoint_1007000/target.encoder.layers_3.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 1064 |
+
checkpoint_1007000/target.encoder.layers_3.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1065 |
+
checkpoint_1007000/target.encoder.layers_3.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 1066 |
+
checkpoint_1007000/target.encoder.layers_3.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 1067 |
+
checkpoint_1007000/target.encoder.layers_3.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 1068 |
+
checkpoint_1007000/target.encoder.layers_3.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 1069 |
+
checkpoint_1007000/target.encoder.layers_3.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1070 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1071 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 1072 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1073 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
| 1074 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
| 1075 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 1076 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 1077 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
| 1078 |
+
checkpoint_1007000/target.encoder.layers_20.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 1079 |
+
checkpoint_1007000/target.encoder.layers_20.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
| 1080 |
+
checkpoint_1007000/target.encoder.layers_20.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 1081 |
+
checkpoint_1007000/target.encoder.layers_20.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.encoder.layers_6.pre_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_6.pre_attention_layer_norm.scale.v/0
ADDED
|
Binary file (15.3 kB). View file
|
|
|
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/.zarray.__tmp14948618746349344249.~1663960300347124~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/.zarray.__tmp15136683855597450498.~1663960300602933~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/.zarray.__tmp16296990592820050215.~1663960300308916~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/.zarray.__tmp1795439801511837984.~1663960300622622~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/.zarray.__tmp2934560606035510395.~1663960300499931~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/.zarray.__tmp5027861047478533928.~1663960300873901~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/.zarray.__tmp9983986926069909442.~1663960300495889~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a7a74412fc829209a2f16c1ff9cdf4a798cfd7c26382c78aabc0ccde1e09dba
|
| 3 |
+
size 7809384
|
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5bc66bfcbd69e3bbd1d668e1e672dd5b21ef6125b83488fa2b95e04a8b3cdd6e
|
| 3 |
+
size 7813178
|
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c45485a6c86ef6dfe72086dc37bdbc7e808978cc347c9c18f56326d05a19ea09
|
| 3 |
+
size 7810279
|
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6213101b791ab427f828d096e60c31dd03326b9ebde3e2f536c3e687ed2a783f
|
| 3 |
+
size 7808163
|
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/4.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cebabc5703b27e1579592f650a0e5fe555a009d3782fe660127216d86602b29d
|
| 3 |
+
size 7808205
|
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/5.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:21408ba9d0c4ab0f9ffee7860766f741c34937d14c1de3e047ee47508f4fe5d9
|
| 3 |
+
size 7812414
|
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/6.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a2affbff2b06f1cdc906fd07ad83351e30563cf4ca429a5a8fce29659961b54
|
| 3 |
+
size 7811881
|
checkpoint_1007000/target.decoder.layers_15.encoder_decoder_attention.out.kernel/7.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6e20274a0ff7779a76321f0704df5aa707400373af97ac1c9074ff693eec1481
|
| 3 |
+
size 7809296
|
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/.zarray.__tmp11247101534926358783.~1663960301029518~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/.zarray.__tmp11530036502559773605.~1663960300599558~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/.zarray.__tmp11533343011294122965.~1663960300685620~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/.zarray.__tmp14471913516189679261.~1663960300548514~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/.zarray.__tmp3767049663912894977.~1663960300826421~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/.zarray.__tmp9965923146098643733.~1663960300822693~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ee80ee001c782596d699c17ddf879c19e3c3064aacffcbfc20a282fa4107f724
|
| 3 |
+
size 19536618
|
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca10d7e6a1ad86ce256970d1666ec65dda418a1269773060bcd54d8f382a1f55
|
| 3 |
+
size 19537551
|
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8d48cc5c497bb2e8aee4416eee09c5b88d83d25e795d5dbe48a030121139b21b
|
| 3 |
+
size 19536101
|
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b21eba00c592b1f2a2c452ea3fca5889c5defbc89aba633a879d3e7e609e455c
|
| 3 |
+
size 19536891
|
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c377bdd2d3b141eb2b735e8473854d56f80af5121d8964310582bc42e70db42e
|
| 3 |
+
size 19535776
|
checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7504b9a6a2fcbcbaff7b01a815aaa87b74b6273d55e57728123fc9e2bf8f412d
|
| 3 |
+
size 19535475
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/.zarray.__tmp13791303887804226964.~1663960300222694~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/.zarray.__tmp2424312097602939268.~1663960300500258~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/.zarray.__tmp4016091107658042345.~1663960300308445~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/.zarray.__tmp6740747515324763376.~1663960300502174~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/.zarray.__tmp9565010299137988556.~1663960300384292~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/.zarray.__tmp9946291196097989741.~1663960300131874~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:88009e7bc9f771e597cc8ba9f7431fa9a1375c310bcc9731991bf17609688992
|
| 3 |
+
size 19558251
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3a8606aee62def3bc25f14d9b709ca9eb4c0904e053d0f623113fb4d683b0a84
|
| 3 |
+
size 19560024
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7bbafb576740c8ecb7fe436ea2631bd94845c937a2dc63d5d95ab08433a7e913
|
| 3 |
+
size 19558342
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e6b9f9cfffbafb2a27d620246b440a508caa5c1c121198192f2b5e8836e79ade
|
| 3 |
+
size 19555996
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2792cb0018eff19428b07326ecfca038b575658883e7822dd333487bcd68e06e
|
| 3 |
+
size 19560283
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0cff8a968ea6fd776e31960a07314cd9f7964aa3c5c23cff09d8ab7f00c9c6d0
|
| 3 |
+
size 19557699
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5578c4a21f4ff942a8a70677ea251f5eb600ea3901cb1a3b17bf22f44e08d525
|
| 3 |
+
size 19560521
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_1.kernel/0.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:edb6c943ee73f44f93f62c53c68d59390b2ac4e396b8874ab3cbc8317bafe74b
|
| 3 |
+
size 19558947
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.query.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.query.kernel/.zarray.__tmp10437380399954342908.~1663960300632967~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.encoder_decoder_attention.query.kernel/.zarray.__tmp12479088181979160916.~1663960300685235~
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|