{
  "cell_emb_style": "cls",
  "d_hid": 32,
  "d_model": 32,
  "do_dab": false,
  "do_mvc": true,
  "domain_spec_batchnorm": false,
  "dropout": 0.4,
  "ecs_threshold": 0.7,
  "explicit_zero_prob": true,
  "fast_transformer_backend": "flash",
  "input_emb_style": "continuous",
  "mvc_decoder_style": "inner product",
  "n_bins": 0,
  "n_cls": 14,
  "n_pert": 9854,
  "n_ps": 23,
  "nhead": 4,
  "nlayers": 2,
  "nlayers_cls": 3,
  "nlayers_pert": 3,
  "ntoken": 5014,
  "num_batch_labels": null,
  "pad_token": "<pad>",
  "pad_value": -2,
  "pert_dim": null,
  "pert_pad_id": null,
  "pre_norm": false,
  "pred_lochness_next": 100,
  "ps_decoder2_nlayer": 5,
  "use_batch_labels": false,
  "use_fast_transformer": true,
  "vocab": null
}