diff --git a/.gitattributes b/.gitattributes index fd2e7674554ce3c28e9374264888079649a425d6..93dafee28bf8b4cb295d5c4a7fa35454cf43e487 100644 --- a/.gitattributes +++ b/.gitattributes @@ -969,3 +969,63 @@ checkpoint_1007000/target.token_embedder.embedding/29.0 filter=lfs diff=lfs merg checkpoint_1007000/target.token_embedder.embedding/11.0 filter=lfs diff=lfs merge=lfs -text checkpoint_1007000/target.token_embedder.embedding/4.0 filter=lfs diff=lfs merge=lfs -text checkpoint_1007000/target.token_embedder.embedding/58.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/41.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/36.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/44.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/46.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/51.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/17.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/57.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/25.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/23.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/55.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/45.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/13.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/62.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/63.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/19.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/48.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/52.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/49.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/53.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/39.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/16.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/18.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/26.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/42.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/10.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.token_embedder.embedding/34.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_7.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_7.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_7.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_7.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_7.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_7.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_7.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_7.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_0.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_0.attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_0.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_0.attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_0.attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_0.attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_0.attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.encoder.layers_0.attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_19.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_19.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_19.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_19.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_19.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_19.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_19.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_19.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text +checkpoint_1007000/target.decoder.layers_18.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text diff --git a/checkpoint_1007000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/.zarray b/checkpoint_1007000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..2d0ddea1f0046008cb8eb77c5f75d9445443f01b --- /dev/null +++ b/checkpoint_1007000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/.zarray @@ -0,0 +1 @@ +{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"