# Extraction header (not part of the program): file size 617 bytes, revision cd8454d.
from fairseq.models.bart.model import mbart_large_architecture
from fairseq.models import register_model_architecture
@register_model_architecture("bart", "t2umbart_large")
def t2umbart_large_architecture(args):
    """Pin the ``t2umbart_large`` settings on *args*, then defer to mBART-large.

    The function is registered under the model name ``"bart"`` with the
    architecture name ``"t2umbart_large"``.

    Every setting listed below is assigned unconditionally, so any value
    already stored on *args* under the same attribute name is overwritten
    before ``mbart_large_architecture`` is invoked on the same object.

    Args:
        args: Mutable attribute container holding the model configuration
            (presumably the ``argparse.Namespace`` fairseq passes to
            architecture functions -- confirm against the caller). It is
            modified in place.

    Returns:
        None.
    """
    # Kept as an ordered mapping so the attributes are written in the same
    # sequence as a plain list of assignments would write them.
    forced_settings = {
        "no_scale_embedding": False,
        "encoder_learned_pos": False,
        "decoder_learned_pos": False,
        "encoder_normalize_before": True,
        "decoder_normalize_before": True,
        "share_decoder_input_output_embed": True,
        "share_all_embeddings": False,
        "layernorm_embedding": False,
        "no_token_positional_embeddings": False,
    }
    for attr_name, attr_value in forced_settings.items():
        setattr(args, attr_name, attr_value)

    # Everything not pinned above is left to the mBART-large architecture
    # function to handle.
    mbart_large_architecture(args)