{
  "architectures": [
    "GigaAMHF"
  ],
  "blank_id": 1024,
  "dtype": "float32",
  "encoder": {
    "conv_kernel_size": 31,
    "d_model": 256,
    "feat_in": 64,
    "ff_expansion_factor": 4,
    "n_heads": 4,
    "n_layers": 4,
    "self_attention_model": "rel_pos",
    "subsampling_factor": 4
  },
  "head": {
    "decoder": {
      "num_classes": 1025,
      "pred_hidden": 256,
      "pred_rnn_layers": 2
    },
    "joint": {
      "enc_hidden": 256,
      "joint_hidden": 512,
      "num_classes": 1025,
      "pred_hidden": 256
    }
  },
  "head_type": "rnnt",
  "transformers_version": "4.57.1"
}