| { | |
| "architectures": [ | |
| "RecogModel" | |
| ], | |
| "cnn_dims": [ | |
| 32, | |
| 64, | |
| 128, | |
| 256 | |
| ], | |
| "dictionary_size": 14230, | |
| "down_kernelsize": [ | |
| [ | |
| 3, | |
| 3 | |
| ] | |
| ], | |
| "down_mbnetv3_kernelsize": [ | |
| [ | |
| 5, | |
| 5 | |
| ] | |
| ], | |
| "down_stride": [ | |
| 2 | |
| ], | |
| "dtype": "float32", | |
| "groupnorm_groups": 32, | |
| "in_channels": 3, | |
| "in_dim": 32, | |
| "mbnetv3_num_blocks": [ | |
| 1, | |
| 1, | |
| 1, | |
| 1 | |
| ], | |
| "mbnetv3_use_se": [ | |
| false, | |
| false, | |
| false, | |
| true | |
| ], | |
| "mhsa_expand": 4, | |
| "mhsa_heads": 2, | |
| "mhsa_intermediate_dim": 256, | |
| "mhsa_layers": 2, | |
| "model_type": "recog_model", | |
| "proj_intermediate_dim": 128, | |
| "res_scale_init": 1.0, | |
| "rope_theta": 10000.0, | |
| "transformers_version": "5.2.0", | |
| "vertical_kernelsize": [ | |
| [ | |
| 3, | |
| 3 | |
| ], | |
| [ | |
| 3, | |
| 3 | |
| ], | |
| [ | |
| 3, | |
| 3 | |
| ] | |
| ], | |
| "vertical_mbnetv3_kernelsize": [ | |
| [ | |
| 5, | |
| 5 | |
| ], | |
| [ | |
| 3, | |
| 3 | |
| ], | |
| [ | |
| 3, | |
| 3 | |
| ] | |
| ], | |
| "vertical_padding": [ | |
| [ | |
| 1, | |
| 1 | |
| ], | |
| [ | |
| 1, | |
| 1 | |
| ], | |
| [ | |
| 0, | |
| 1 | |
| ] | |
| ], | |
| "vertical_stride": [ | |
| 2, | |
| 2, | |
| 1 | |
| ] | |
| } | |