diff --git a/.gitattributes b/.gitattributes index d63dd30314ffb0029dfaab328b9852b45fe2be10..4732342f2578b4efe8c695287a6f5ada43e3157c 100644 --- a/.gitattributes +++ b/.gitattributes @@ -1293,3 +1293,53 @@ checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.value.kern checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text checkpoint_1007000/target.decoder.layers_10.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text checkpoint_1007000/target.decoder.layers_10.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_10.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_10.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_10.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_10.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_10.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_10.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_9.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_9.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_9.self_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_9.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_9.self_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_9.self_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_9.self_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_9.self_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_21.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_21.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_21.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_21.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_21.attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_21.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_21.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_21.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_6.attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_6.attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_6.attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_6.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_6.attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_6.attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_6.attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_6.attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_12.attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_12.attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_12.attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_12.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_12.attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_12.attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_12.attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_12.attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_1.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_1.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_1.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_1.encoder_decoder_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_1.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_1.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_1.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_1.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_18.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_18.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_18.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_18.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text diff --git a/checkpoint_1007000/target.decoder.layers_1.encoder_decoder_attention.key.kernel/.zarray b/checkpoint_1007000/target.decoder.layers_1.encoder_decoder_attention.key.kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ddb67420063a3a02f5bd9b9eb19e636151970a4c --- /dev/null +++ b/checkpoint_1007000/target.decoder.layers_1.encoder_decoder_attention.key.kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"