| { | |
| "_name_or_path": "sanchit-gandhi/whisper-medium-fleurs-lang-id", | |
| "activation_dropout": 0.0, | |
| "activation_function": "gelu", | |
| "apply_spec_augment": false, | |
| "architectures": [ | |
| "WhisperForAudioClassification" | |
| ], | |
| "attention_dropout": 0.0, | |
| "begin_suppress_tokens": [ | |
| 220, | |
| 50257 | |
| ], | |
| "bos_token_id": 50257, | |
| "classifier_proj_size": 256, | |
| "d_model": 1024, | |
| "decoder_attention_heads": 16, | |
| "decoder_ffn_dim": 4096, | |
| "decoder_layerdrop": 0.0, | |
| "decoder_layers": 24, | |
| "decoder_start_token_id": 50258, | |
| "dropout": 0.0, | |
| "encoder_attention_heads": 16, | |
| "encoder_ffn_dim": 4096, | |
| "encoder_layerdrop": 0.0, | |
| "encoder_layers": 24, | |
| "eos_token_id": 50257, | |
| "finetuning_task": "audio-classification", | |
| "forced_decoder_ids": [ | |
| [ | |
| 1, | |
| 50259 | |
| ], | |
| [ | |
| 2, | |
| 50359 | |
| ], | |
| [ | |
| 3, | |
| 50363 | |
| ] | |
| ], | |
| "id2label": { | |
| "0": "Afrikaans", | |
| "1": "Amharic", | |
| "2": "Arabic", | |
| "3": "Assamese", | |
| "4": "Asturian", | |
| "5": "Azerbaijani", | |
| "6": "Belarusian", | |
| "7": "Bulgarian", | |
| "8": "Bengali", | |
| "9": "Bosnian", | |
| "10": "Catalan", | |
| "11": "Cebuano", | |
| "12": "Sorani-Kurdish", | |
| "13": "Mandarin Chinese", | |
| "14": "Czech", | |
| "15": "Welsh", | |
| "16": "Danish", | |
| "17": "German", | |
| "18": "Greek", | |
| "19": "English", | |
| "20": "Spanish", | |
| "21": "Estonian", | |
| "22": "Persian", | |
| "23": "Fula", | |
| "24": "Finnish", | |
| "25": "Filipino", | |
| "26": "French", | |
| "27": "Irish", | |
| "28": "Galician", | |
| "29": "Gujarati", | |
| "30": "Hausa", | |
| "31": "Hebrew", | |
| "32": "Hindi", | |
| "33": "Croatian", | |
| "34": "Hungarian", | |
| "35": "Armenian", | |
| "36": "Indonesian", | |
| "37": "Igbo", | |
| "38": "Icelandic", | |
| "39": "Italian", | |
| "40": "Japanese", | |
| "41": "Javanese", | |
| "42": "Georgian", | |
| "43": "Kamba", | |
| "44": "Kabuverdianu", | |
| "45": "Kazakh", | |
| "46": "Khmer", | |
| "47": "Kannada", | |
| "48": "Korean", | |
| "49": "Kyrgyz", | |
| "50": "Luxembourgish", | |
| "51": "Ganda", | |
| "52": "Lingala", | |
| "53": "Lao", | |
| "54": "Lithuanian", | |
| "55": "Luo", | |
| "56": "Latvian", | |
| "57": "Maori", | |
| "58": "Macedonian", | |
| "59": "Malayalam", | |
| "60": "Mongolian", | |
| "61": "Marathi", | |
| "62": "Malay", | |
| "63": "Maltese", | |
| "64": "Burmese", | |
| "65": "Norwegian", | |
| "66": "Nepali", | |
| "67": "Dutch", | |
| "68": "Northern-Sotho", | |
| "69": "Nyanja", | |
| "70": "Occitan", | |
| "71": "Oromo", | |
| "72": "Oriya", | |
| "73": "Punjabi", | |
| "74": "Polish", | |
| "75": "Pashto", | |
| "76": "Portuguese", | |
| "77": "Romanian", | |
| "78": "Russian", | |
| "79": "Sindhi", | |
| "80": "Slovak", | |
| "81": "Slovenian", | |
| "82": "Shona", | |
| "83": "Somali", | |
| "84": "Serbian", | |
| "85": "Swedish", | |
| "86": "Swahili", | |
| "87": "Tamil", | |
| "88": "Telugu", | |
| "89": "Tajik", | |
| "90": "Thai", | |
| "91": "Turkish", | |
| "92": "Ukrainian", | |
| "93": "Umbundu", | |
| "94": "Urdu", | |
| "95": "Uzbek", | |
| "96": "Vietnamese", | |
| "97": "Wolof", | |
| "98": "Xhosa", | |
| "99": "Yoruba", | |
| "100": "Cantonese Chinese", | |
| "101": "Zulu" | |
| }, | |
| "init_std": 0.02, | |
| "is_encoder_decoder": true, | |
| "label2id": { | |
| "Afrikaans": "0", | |
| "Amharic": "1", | |
| "Arabic": "2", | |
| "Armenian": "35", | |
| "Assamese": "3", | |
| "Asturian": "4", | |
| "Azerbaijani": "5", | |
| "Belarusian": "6", | |
| "Bengali": "8", | |
| "Bosnian": "9", | |
| "Bulgarian": "7", | |
| "Burmese": "64", | |
| "Cantonese Chinese": "100", | |
| "Catalan": "10", | |
| "Cebuano": "11", | |
| "Croatian": "33", | |
| "Czech": "14", | |
| "Danish": "16", | |
| "Dutch": "67", | |
| "English": "19", | |
| "Estonian": "21", | |
| "Filipino": "25", | |
| "Finnish": "24", | |
| "French": "26", | |
| "Fula": "23", | |
| "Galician": "28", | |
| "Ganda": "51", | |
| "Georgian": "42", | |
| "German": "17", | |
| "Greek": "18", | |
| "Gujarati": "29", | |
| "Hausa": "30", | |
| "Hebrew": "31", | |
| "Hindi": "32", | |
| "Hungarian": "34", | |
| "Icelandic": "38", | |
| "Igbo": "37", | |
| "Indonesian": "36", | |
| "Irish": "27", | |
| "Italian": "39", | |
| "Japanese": "40", | |
| "Javanese": "41", | |
| "Kabuverdianu": "44", | |
| "Kamba": "43", | |
| "Kannada": "47", | |
| "Kazakh": "45", | |
| "Khmer": "46", | |
| "Korean": "48", | |
| "Kyrgyz": "49", | |
| "Lao": "53", | |
| "Latvian": "56", | |
| "Lingala": "52", | |
| "Lithuanian": "54", | |
| "Luo": "55", | |
| "Luxembourgish": "50", | |
| "Macedonian": "58", | |
| "Malay": "62", | |
| "Malayalam": "59", | |
| "Maltese": "63", | |
| "Mandarin Chinese": "13", | |
| "Maori": "57", | |
| "Marathi": "61", | |
| "Mongolian": "60", | |
| "Nepali": "66", | |
| "Northern-Sotho": "68", | |
| "Norwegian": "65", | |
| "Nyanja": "69", | |
| "Occitan": "70", | |
| "Oriya": "72", | |
| "Oromo": "71", | |
| "Pashto": "75", | |
| "Persian": "22", | |
| "Polish": "74", | |
| "Portuguese": "76", | |
| "Punjabi": "73", | |
| "Romanian": "77", | |
| "Russian": "78", | |
| "Serbian": "84", | |
| "Shona": "82", | |
| "Sindhi": "79", | |
| "Slovak": "80", | |
| "Slovenian": "81", | |
| "Somali": "83", | |
| "Sorani-Kurdish": "12", | |
| "Spanish": "20", | |
| "Swahili": "86", | |
| "Swedish": "85", | |
| "Tajik": "89", | |
| "Tamil": "87", | |
| "Telugu": "88", | |
| "Thai": "90", | |
| "Turkish": "91", | |
| "Ukrainian": "92", | |
| "Umbundu": "93", | |
| "Urdu": "94", | |
| "Uzbek": "95", | |
| "Vietnamese": "96", | |
| "Welsh": "15", | |
| "Wolof": "97", | |
| "Xhosa": "98", | |
| "Yoruba": "99", | |
| "Zulu": "101" | |
| }, | |
| "mask_feature_length": 10, | |
| "mask_feature_min_masks": 0, | |
| "mask_feature_prob": 0.0, | |
| "mask_time_length": 10, | |
| "mask_time_min_masks": 2, | |
| "mask_time_prob": 0.05, | |
| "max_length": 448, | |
| "max_source_positions": 1500, | |
| "max_target_positions": 448, | |
| "model_type": "whisper", | |
| "num_hidden_layers": 24, | |
| "num_mel_bins": 80, | |
| "pad_token_id": 50257, | |
| "scale_embedding": false, | |
| "suppress_tokens": [ | |
| 1, | |
| 2, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 14, | |
| 25, | |
| 26, | |
| 27, | |
| 28, | |
| 29, | |
| 31, | |
| 58, | |
| 59, | |
| 60, | |
| 61, | |
| 62, | |
| 63, | |
| 90, | |
| 91, | |
| 92, | |
| 93, | |
| 359, | |
| 503, | |
| 522, | |
| 542, | |
| 873, | |
| 893, | |
| 902, | |
| 918, | |
| 922, | |
| 931, | |
| 1350, | |
| 1853, | |
| 1982, | |
| 2460, | |
| 2627, | |
| 3246, | |
| 3253, | |
| 3268, | |
| 3536, | |
| 3846, | |
| 3961, | |
| 4183, | |
| 4667, | |
| 6585, | |
| 6647, | |
| 7273, | |
| 9061, | |
| 9383, | |
| 10428, | |
| 10929, | |
| 11938, | |
| 12033, | |
| 12331, | |
| 12562, | |
| 13793, | |
| 14157, | |
| 14635, | |
| 15265, | |
| 15618, | |
| 16553, | |
| 16604, | |
| 18362, | |
| 18956, | |
| 20075, | |
| 21675, | |
| 22520, | |
| 26130, | |
| 26161, | |
| 26435, | |
| 28279, | |
| 29464, | |
| 31650, | |
| 32302, | |
| 32470, | |
| 36865, | |
| 42863, | |
| 47425, | |
| 49870, | |
| 50254, | |
| 50258, | |
| 50360, | |
| 50361, | |
| 50362 | |
| ], | |
| "torch_dtype": "float16", | |
| "transformers_version": "4.30.0.dev0", | |
| "use_cache": true, | |
| "use_weighted_layer_sum": false, | |
| "vocab_size": 51865 | |
| } | |