{
  "model_type": "wav2vec2",
  "architectures": [
    "Wav2Vec2ForCTC"
  ],
  "hidden_size": 768,
  "num_hidden_layers": 12,
  "num_attention_heads": 12,
  "intermediate_size": 3072,
  "vocab_size": 32,
  "feat_extract_activation": "gelu",
  "epoch": 80
}