{
  "model_type": "small_audio_classifier_mlp",
  "torch_dtype": "float32",
  "input_dim": 6144,
  "num_labels": 10,
  "hidden_dims": [
    512,
    256
  ],
  "dropout": 0.2,
  "activation": "gelu",
  "task": "audio_classification",
  "outputs": {
    "logits": "float32[batch, num_labels]"
  },
  "preprocessing": {
    "expected_input": "flattened log-mel spectrogram or other fixed-length audio features",
    "example_logmel": {
      "n_mels": 64,
      "n_frames": 96,
      "flatten": true,
      "input_dim": 6144
    },
    "note": "compute features outside the model; this model is intentionally tiny for assignments"
  },
  "id2label": {
    "0": "class_0",
    "1": "class_1",
    "2": "class_2",
    "3": "class_3",
    "4": "class_4",
    "5": "class_5",
    "6": "class_6",
    "7": "class_7",
    "8": "class_8",
    "9": "class_9"
  },
  "label2id": {
    "class_0": 0,
    "class_1": 1,
    "class_2": 2,
    "class_3": 3,
    "class_4": 4,
    "class_5": 5,
    "class_6": 6,
    "class_7": 7,
    "class_8": 8,
    "class_9": 9
  },
  "version": "0.1.0"
}