diff --git a/.gitattributes b/.gitattributes index 2adbea2783e9d31261969d5f9a19ab7cf41db17b..c47a4a42f0ab1c2381545d05283717d1329c1784 100644 --- a/.gitattributes +++ b/.gitattributes @@ -1838,3 +1838,54 @@ checkpoint_1007000/target.encoder.layers_14.mlp.wo.kernel/4.0 filter=lfs diff=lf checkpoint_1007000/target.encoder.layers_7.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text checkpoint_1007000/target.encoder.layers_7.attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text checkpoint_1007000/target.encoder.layers_7.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_7.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_7.attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_7.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_7.attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_7.attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_8.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_8.attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_8.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_8.attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_8.attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_8.attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_8.attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_8.attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_13.encoder_decoder_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_13.attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_13.attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_13.attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_13.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_13.attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_13.attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_13.attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_13.attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_13.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_13.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_13.self_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_13.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_13.self_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_13.self_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_13.self_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_13.self_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_6.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_6.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_6.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_6.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_6.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_6.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text diff --git a/checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.out.kernel/.zarray b/checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.out.kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..46a17786925fd95f6e6bc0c41a18b141457bb2ee --- /dev/null +++ b/checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.out.kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"