| { | |
| "cell_emb_style": "cls", | |
| "d_hid": 256, | |
| "d_model": 256, | |
| "do_dab": false, | |
| "do_mvc": true, | |
| "domain_spec_batchnorm": false, | |
| "dropout": 0.1, | |
| "ecs_threshold": 0.7, | |
| "explicit_zero_prob": true, | |
| "fast_transformer_backend": "flash", | |
| "input_emb_style": "continuous", | |
| "mvc_decoder_style": "inner product", | |
| "n_bins": 51, | |
| "n_cls": 20, | |
| "n_pert": 40, | |
| "n_ps": 1, | |
| "nhead": 8, | |
| "nlayers": 6, | |
| "nlayers_cls": 3, | |
| "nlayers_pert": 4, | |
| "ntoken": 36604, | |
| "num_batch_labels": null, | |
| "pad_token": "<pad>", | |
| "pad_value": -2, | |
| "pert_dim": null, | |
| "pert_pad_id": null, | |
| "pre_norm": false, | |
| "pred_lochness_next": false, | |
| "ps_decoder2_nlayer": 3, | |
| "use_batch_labels": false, | |
| "use_fast_transformer": true, | |
| "vocab": null | |
| } |