{ "architectures": ["TransfoXLModel"], "model_type": "transfo-xl", "n_token": 267735, "d_embed": 512, "d_model": 512, "d_head": 64, "d_inner": 2048, "n_head": 8, "n_layer": 6, "mem_len": 512, "same_length": false, "clamp_len": -1, "dropout": 0.1, "dropatt": 0.1 }