# Model configuration: a flat mapping of scalar settings, one key per line.
# NOTE(review): the meaning of each key is defined by the code that loads this
# file, which is not visible here; the hedged notes below should be confirmed
# against that consumer.

# Identifier of this configuration preset and the model variant it selects.
name: small
type: ddit

# Width settings (presumably the main hidden width and the width of the
# conditioning embedding; verify against the model code).
hidden_size: 768
cond_dim: 128

# `length` is explicitly null in this preset; `length_range` is given instead.
# The range is kept as a quoted string because it mixes a comma-separated list
# with a dash range ('43-49'); it is presumably parsed by the consumer, so
# TODO confirm the expected format (e.g. whether the range is inclusive).
length: null
length_range: '25,27,28,31,35,43-49'

# Depth and attention-head count. 768 / 12 = 64, so hidden_size divides evenly
# by n_heads.
n_blocks: 12
n_heads: 12

# Feature toggles and regularisation, written as canonical lowercase booleans.
scale_by_sigma: true
dropout: 0.1
tie_word_embeddings: false