| { |
| "architectures": [ |
| "MertForSequenceClassification" |
| ], |
| "attention_probs_dropout_prob": 0.1, |
| "classifier_dropout": null, |
| "conv_kernel": [ |
| 10, |
| 3, |
| 3, |
| 3, |
| 3, |
| 2, |
| 2 |
| ], |
| "conv_stride": [ |
| 5, |
| 2, |
| 2, |
| 2, |
| 2, |
| 2, |
| 2 |
| ], |
| "feature_extractor_type": "Wav2Vec2FeatureExtractor", |
| "feat_extract_activation": "gelu", |
| "feat_extract_norm": "group", |
| "feat_proj_dropout": 0.0, |
| "final_dropout": 0.1, |
| "hidden_act": "gelu", |
| "hidden_dropout_prob": 0.1, |
| "hidden_size": 768, |
| "initializer_range": 0.02, |
| "intermediate_size": 3072, |
| "layer_norm_eps": 1e-05, |
| "layerdrop": 0.1, |
| "mask_feature_length": 10, |
| "mask_feature_prob": 0.0, |
| "mask_time_length": 10, |
| "mask_time_prob": 0.05, |
| "model_type": "mert", |
| "num_attention_heads": 12, |
| "num_conv_pos_embeddings": 128, |
| "num_conv_pos_embedding_groups": 16, |
| "num_feat_extract_layers": 7, |
| "num_hidden_layers": 12, |
| "num_labels": 9, |
| "pad_token_id": 0, |
| "problem_type": "single_label_classification", |
| "transformers_version": "4.30.0", |
| "use_weighted_layer_sum": false, |
| "vocab_size": 32, |
| "id2label": { |
| "0": "楽しい", |
| "1": "盛り上がる", |
| "2": "ζγ", |
| "3": "γγγγγγ", |
| "4": "γγ©γγ©γγ", |
| "5": "悲しい", |
| "6": "切ない", |
| "7": "リラックスした", |
| "8": "ηγγγ" |
| }, |
| "label2id": { |
| "楽しい": 0, |
| "盛り上がる": 1, |
| "ζγ": 2, |
| "γγγγγγ": 3, |
| "γγ©γγ©γγ": 4, |
| "悲しい": 5, |
| "切ない": 6, |
| "リラックスした": 7, |
| "ηγγγ": 8 |
| } |
| } |
|
|