elmadany committed
Commit 4701d9d · verified · Parent: 44f4147

Initial model upload

README.md ADDED
@@ -0,0 +1,203 @@
+ ---
+ language:
+ - ak # Akuapim Twi
+ - tw # Asante Twi
+ - aeb # Tunisian Arabic
+ - af # Afrikaans
+ - am # Amharic
+ - ar # Arabic
+ - bas # Basaa
+ - bem # Bemba
+ - dav # Taita
+ - dyu # Dyula
+ - en # English
+ - pcm # Nigerian Pidgin
+ - ee # Ewe
+ - fat # Fanti
+ - fon # Fon
+ - fuc # Pulaar
+ - ff # Pular
+ - gaa # Ga
+ - ha # Hausa
+ - ig # Igbo
+ - kab # Kabyle
+ - rw # Kinyarwanda
+ - kln # Kalenjin
+ - ln # Lingala
+ - loz # Lozi
+ - lg # Luganda
+ - luo # Luo
+ - mlq # Western Maninkakan
+ - nr # South Ndebele
+ - nso # Northern Sotho
+ - ny # Chichewa
+ - st # Southern Sotho
+ - srr # Serer
+ - ss # Swati
+ - sus # Susu
+ - sw # Kiswahili/Swahili
+ - tig # Tigre
+ - ti # Tigrinya
+ - toi # Tonga
+ - tn # Tswana
+ - ts # Tsonga
+ - tw # Twi
+ - ve # Venda
+ - wo # Wolof
+ - xh # Xhosa
+ - yo # Yoruba
+ - zgh # Standard Moroccan Tamazight
+ - zu # Zulu
+
+ license: cc-by-4.0
+ tags:
+ - automatic-speech-recognition
+ - audio
+ - speech
+ - african-languages
+ - multilingual
+ - simba
+ - low-resource
+ - speech-recognition
+ - asr
+ - spoken-language-identification
+ - language-identification
+ datasets:
+ - UBC-NLP/SimbaBench
+ metrics:
+ - wer
+ - cer
+ - accuracy
+ library_name: transformers
+ pipeline_tag: audio-classification
+ ---
+
+ <div align="center">
+
+ <img src="https://africa.dlnlp.ai/simba/images/VoC_logo.png" alt="VoC Logo">
+
+ [![EMNLP 2025 Paper](https://img.shields.io/badge/EMNLP_2025-Paper-B31B1B?style=for-the-badge&logo=arxiv&logoColor=B31B1B&labelColor=FFCDD2)](https://aclanthology.org/2025.emnlp-main.559/)
+ [![Official Website](https://img.shields.io/badge/Official-Website-2EA44F?style=for-the-badge&logo=googlechrome&logoColor=2EA44F&labelColor=C8E6C9)](https://africa.dlnlp.ai/simba/)
+ [![SimbaBench](https://img.shields.io/badge/SimbaBench-Benchmark-8A2BE2?style=for-the-badge&logo=googlecharts&logoColor=8A2BE2&labelColor=E1BEE7)](https://huggingface.co/spaces/UBC-NLP/SimbaBench)
+ [![GitHub Repository](https://img.shields.io/badge/GitHub-Repository-181717?style=for-the-badge&logo=github&logoColor=181717&labelColor=E0E0E0)](https://github.com/UBC-NLP/simba)
+ [![Hugging Face](https://img.shields.io/badge/%F0%9F%A4%97%20Hugging%20Face-Models-FFD21E?style=for-the-badge&logoColor=181717&labelColor=FFF9C4)](https://huggingface.co/collections/UBC-NLP/simba-speech-series)
+ [![Hugging Face Dataset](https://img.shields.io/badge/%F0%9F%A4%97%20Hugging%20Face-Dataset-FFD21E?style=for-the-badge&logoColor=181717&labelColor=FFF9C4)](https://huggingface.co/datasets/UBC-NLP/SimbaBench_dataset)
+
+ </div>
+
+ ## *Bridging the Digital Divide for African AI*
+
+ **Voice of a Continent** is a comprehensive open-source ecosystem designed to bring African languages to the forefront of artificial intelligence. By providing a unified suite of benchmarking tools and state-of-the-art models, we aim to make the future of speech technology inclusive, representative, and accessible to over a billion people.
+
+ ## Best-in-Class Multilingual Models
+
+ <img src="https://africa.dlnlp.ai/simba/images/VoC_simba" alt="VoC Simba Models Logo">
+
+ Introduced in our EMNLP 2025 paper *[Voice of a Continent](https://aclanthology.org/2025.emnlp-main.559/)*, the **Simba Series** represents the current state-of-the-art for African speech AI.
+
+ - **Unified Suite:** Models optimized for African languages.
+ - **Superior Accuracy:** Outperforms generic multilingual models by leveraging SimbaBench's high-quality, domain-diverse datasets.
+ - **Multitask Capability:** Designed for high performance in ASR (Automatic Speech Recognition) and TTS (Text-to-Speech).
+ - **Inclusion-First:** Specifically built to mitigate the "digital divide" by empowering speakers of underrepresented languages.
+
+ The **Simba** family consists of state-of-the-art models fine-tuned using SimbaBench. These models achieve superior performance by leveraging dataset quality, domain diversity, and language family relationships.
+
+ ### 🔍 Simba-SLID (Spoken Language Identification)
+ * **🎯 Task:** `Spoken Language Identification` for intelligent input routing.
+ * **🌍 Language Coverage (49 African languages)**
+ > **Akuapim Twi** (`Akuapim-twi`), **Asante Twi** (`Asante-twi`), **Tunisian Arabic** (`aeb`), **Afrikaans** (`afr`), **Amharic** (`amh`), **Arabic** (`ara`), **Basaa** (`bas`), **Bemba** (`bem`), **Taita** (`dav`), **Dyula** (`dyu`), **English** (`eng`), **Nigerian Pidgin** (`eng-zul`), **Ewe** (`ewe`), **Fanti** (`fat`), **Fon** (`fon`), **Pulaar** (`fuc`), **Pular** (`fuf`), **Ga** (`gaa`), **Hausa** (`hau`), **Igbo** (`ibo`), **Kabyle** (`kab`), **Kinyarwanda** (`kin`), **Kalenjin** (`kln`), **Lingala** (`lin`), **Lozi** (`loz`), **Luganda** (`lug`), **Luo** (`luo`), **Western Maninkakan** (`mlq`), **South Ndebele** (`nbl`), **Northern Sotho** (`nso`), **Chichewa** (`nya`), **Southern Sotho** (`sot`), **Serer** (`srr`), **Swati** (`ssw`), **Susu** (`sus`), **Kiswahili** (`swa`), **Swahili** (`swh`), **Tigre** (`tig`), **Tigrinya** (`tir`), **Tonga** (`toi`), **Tswana** (`tsn`), **Tsonga** (`tso`), **Twi** (`twi`), **Venda** (`ven`), **Wolof** (`wol`), **Xhosa** (`xho`), **Yoruba** (`yor`), **Standard Moroccan Tamazight** (`zgh`), **Zulu** (`zul`)
+
+ | **SLID Model** | **Architecture** | **Hugging Face Card** | **Status** |
+ | :--- | :--- | :---: | :---: |
+ | **Simba-SLID-49** 🔍 | HuBERT | 🤗 [https://huggingface.co/UBC-NLP/Simba-SLIS-49](https://huggingface.co/UBC-NLP/Simba-SLIS-49) | ✅ Released |
+
+ **🧩 Usage Example**
+
+ You can run inference with the Hugging Face `transformers` library:
+
+ ```python
+ from transformers import (
+     HubertForSequenceClassification,
+     AutoFeatureExtractor,
+     AutoProcessor
+ )
+ import torch
+
+ device = "cuda" if torch.cuda.is_available() else "cpu"
+
+ model_id = "UBC-NLP/Simba-SLIS_49"
+ model = HubertForSequenceClassification.from_pretrained(model_id).to(device)
+
+ # HuBERT checkpoints may ship either a full processor or a bare feature extractor
+ try:
+     processor = AutoProcessor.from_pretrained(model_id)
+     print("Loaded Simba-SLIS_49 model with AutoProcessor")
+ except Exception:
+     processor = AutoFeatureExtractor.from_pretrained(model_id)
+     print("Loaded Simba-SLIS_49 model with AutoFeatureExtractor")
+
+ # Put the model in inference mode
+ model.eval()
+
+ audio_arrays = []  # add your 16 kHz mono audio arrays here
+ sample_rate = 16000
+
+ inputs = processor(audio_arrays, sampling_rate=sample_rate, return_tensors="pt", padding=True).to(device)
+
+ # Different checkpoints may expect slightly different input formats
+ try:
+     logits = model(**inputs).logits
+ except Exception as e:
+     # Fall back to an explicit input_values call if the generic call fails
+     if "input_values" in inputs:
+         logits = model(input_values=inputs.input_values).logits
+     else:
+         raise e
+
+ # Softmax probabilities over the 49 language labels
+ probs = torch.nn.functional.softmax(logits, dim=-1)
+
+ # Highest probability (confidence) and predicted label ID per utterance
+ confidence_values, pred_ids = torch.max(probs, dim=-1)
+
+ # Convert to Python lists
+ pred_ids = pred_ids.tolist()
+ confidence_values = confidence_values.cpu().tolist()
+
+ # Map label IDs to language codes
+ pred_labels = [model.config.id2label[i] for i in pred_ids]
+
+ print(pred_labels, confidence_values)
+ ```
+
171
+
172
+ ## Citation
173
+
174
+ If you use the Simba models or SimbaBench benchmark for your scientific publication, or if you find the resources in this website useful, please cite our paper.
175
+
176
+ ```bibtex
177
+
178
+ @inproceedings{elmadany-etal-2025-voice,
179
+ title = "Voice of a Continent: Mapping {A}frica{'}s Speech Technology Frontier",
180
+ author = "Elmadany, AbdelRahim A. and
181
+ Kwon, Sang Yun and
182
+ Toyin, Hawau Olamide and
183
+ Alcoba Inciarte, Alcides and
184
+ Aldarmaki, Hanan and
185
+ Abdul-Mageed, Muhammad",
186
+ editor = "Christodoulopoulos, Christos and
187
+ Chakraborty, Tanmoy and
188
+ Rose, Carolyn and
189
+ Peng, Violet",
190
+ booktitle = "Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing",
191
+ month = nov,
192
+ year = "2025",
193
+ address = "Suzhou, China",
194
+ publisher = "Association for Computational Linguistics",
195
+ url = "https://aclanthology.org/2025.emnlp-main.559/",
196
+ doi = "10.18653/v1/2025.emnlp-main.559",
197
+ pages = "11039--11061",
198
+ ISBN = "979-8-89176-332-6",
199
+ }
200
+
201
+ ```
202
+
203
+
config.json ADDED
@@ -0,0 +1,180 @@
+ {
+   "_name_or_path": "ajesujoba/AfriHuBERT",
+   "activation_dropout": 0.1,
+   "apply_spec_augment": true,
+   "architectures": [
+     "HubertForSequenceClassification"
+   ],
+   "attention_dropout": 0.1,
+   "bos_token_id": 1,
+   "classifier_proj_size": 256,
+   "conv_bias": false,
+   "conv_dim": [
+     512,
+     512,
+     512,
+     512,
+     512,
+     512,
+     512
+   ],
+   "conv_kernel": [
+     10,
+     3,
+     3,
+     3,
+     3,
+     2,
+     2
+   ],
+   "conv_pos_batch_norm": false,
+   "conv_stride": [
+     5,
+     2,
+     2,
+     2,
+     2,
+     2,
+     2
+   ],
+   "ctc_loss_reduction": "sum",
+   "ctc_zero_infinity": false,
+   "do_stable_layer_norm": false,
+   "eos_token_id": 2,
+   "feat_extract_activation": "gelu",
+   "feat_extract_dropout": 0.0,
+   "feat_extract_norm": "group",
+   "feat_proj_dropout": 0.1,
+   "feat_proj_layer_norm": true,
+   "final_dropout": 0.1,
+   "finetuning_task": "audio-classification",
+   "gradient_checkpointing": false,
+   "hidden_act": "gelu",
+   "hidden_dropout": 0.1,
+   "hidden_dropout_prob": 0.1,
+   "hidden_size": 768,
+   "id2label": {
+     "0": "Akuapim-twi",
+     "1": "Asante-twi",
+     "10": "eng",
+     "11": "eng-zul",
+     "12": "ewe",
+     "13": "fat",
+     "14": "fon",
+     "15": "fuc",
+     "16": "fuf",
+     "17": "gaa",
+     "18": "hau",
+     "19": "ibo",
+     "2": "aeb",
+     "20": "kab",
+     "21": "kin",
+     "22": "kln",
+     "23": "lin",
+     "24": "loz",
+     "25": "lug",
+     "26": "luo",
+     "27": "mlq",
+     "28": "nbl",
+     "29": "nso",
+     "3": "afr",
+     "30": "nya",
+     "31": "sot",
+     "32": "srr",
+     "33": "ssw",
+     "34": "sus",
+     "35": "swa",
+     "36": "swh",
+     "37": "tig",
+     "38": "tir",
+     "39": "toi",
+     "4": "amh",
+     "40": "tsn",
+     "41": "tso",
+     "42": "twi",
+     "43": "ven",
+     "44": "wol",
+     "45": "xho",
+     "46": "yor",
+     "47": "zgh",
+     "48": "zul",
+     "5": "ara",
+     "6": "bas",
+     "7": "bem",
+     "8": "dav",
+     "9": "dyu"
+   },
+   "initializer_range": 0.02,
+   "intermediate_size": 3072,
+   "label2id": {
+     "Akuapim-twi": "0",
+     "Asante-twi": "1",
+     "aeb": "2",
+     "afr": "3",
+     "amh": "4",
+     "ara": "5",
+     "bas": "6",
+     "bem": "7",
+     "dav": "8",
+     "dyu": "9",
+     "eng": "10",
+     "eng-zul": "11",
+     "ewe": "12",
+     "fat": "13",
+     "fon": "14",
+     "fuc": "15",
+     "fuf": "16",
+     "gaa": "17",
+     "hau": "18",
+     "ibo": "19",
+     "kab": "20",
+     "kin": "21",
+     "kln": "22",
+     "lin": "23",
+     "loz": "24",
+     "lug": "25",
+     "luo": "26",
+     "mlq": "27",
+     "nbl": "28",
+     "nso": "29",
+     "nya": "30",
+     "sot": "31",
+     "srr": "32",
+     "ssw": "33",
+     "sus": "34",
+     "swa": "35",
+     "swh": "36",
+     "tig": "37",
+     "tir": "38",
+     "toi": "39",
+     "tsn": "40",
+     "tso": "41",
+     "twi": "42",
+     "ven": "43",
+     "wol": "44",
+     "xho": "45",
+     "yor": "46",
+     "zgh": "47",
+     "zul": "48"
+   },
+   "layer_norm_eps": 1e-05,
+   "layerdrop": 0.1,
+   "mask_feature_length": 10,
+   "mask_feature_min_masks": 0,
+   "mask_feature_prob": 0.0,
+   "mask_time_length": 10,
+   "mask_time_min_masks": 2,
+   "mask_time_prob": 0.05,
+   "model_type": "hubert",
+   "num_attention_heads": 12,
+   "num_conv_pos_embedding_groups": 16,
+   "num_conv_pos_embeddings": 128,
+   "num_feat_extract_layers": 7,
+   "num_hidden_layers": 12,
+   "pad_token_id": 0,
+   "tokenizer_class": "Wav2Vec2CTCTokenizer",
+   "torch_dtype": "float32",
+   "transformers_version": "4.48.1",
+   "use_weighted_layer_sum": false,
+   "vocab_size": 32
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:b093d79e77272669d34041d5b010e0d79c6fa0e0222b94cf300f24019786eb14
+ size 378350268
preprocessor_config.json ADDED
@@ -0,0 +1,9 @@
+ {
+   "do_normalize": true,
+   "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+   "feature_size": 1,
+   "padding_side": "right",
+   "padding_value": 0,
+   "return_attention_mask": false,
+   "sampling_rate": 16000
+ }
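
These settings mean the feature extractor expects 16 kHz mono input, normalizes each waveform to zero mean and unit variance, and right-pads batches with zeros. A minimal sketch of the effect (random noise stands in for real speech):

```python
import numpy as np
from transformers import Wav2Vec2FeatureExtractor

# Recreate the extractor with the settings from preprocessor_config.json
extractor = Wav2Vec2FeatureExtractor(
    feature_size=1,
    sampling_rate=16000,
    padding_value=0.0,
    do_normalize=True,
    return_attention_mask=False,
)

# Two clips of different lengths
clips = [np.random.randn(16000), np.random.randn(8000)]
batch = extractor(clips, sampling_rate=16000, return_tensors="np", padding=True)

print(batch.input_values.shape)  # (2, 16000): the shorter clip is right-padded
```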
trainer_state.json ADDED
@@ -0,0 +1,552 @@
+ {
+   "best_metric": 0.4363306793570824,
+   "best_model_checkpoint": "./outputs_slid/ajesujoba/AfriHuBERT/checkpoint-1830",
+   "epoch": 29.99591836734694,
+   "eval_steps": 500,
+   "global_step": 5490,
+   "is_hyper_param_search": false,
+   "is_local_process_zero": true,
+   "is_world_process_zero": true,
+   "log_history": [
+     {
+       "epoch": 0.9959183673469387,
+       "grad_norm": 0.7721740007400513,
+       "learning_rate": 1.6666666666666667e-05,
+       "loss": 3.7874,
+       "step": 183
+     },
+     {
+       "epoch": 0.9959183673469387,
+       "eval_accuracy": 0.04349865165904561,
+       "eval_f1": 0.004599781789327515,
+       "eval_loss": 3.9047515392303467,
+       "eval_runtime": 28.6696,
+       "eval_samples_per_second": 297.493,
+       "eval_steps_per_second": 0.593,
+       "step": 183
+     },
+     {
+       "epoch": 1.9959183673469387,
+       "grad_norm": 0.8705180883407593,
+       "learning_rate": 3.3333333333333335e-05,
+       "loss": 3.0785,
+       "step": 366
+     },
+     {
+       "epoch": 1.9959183673469387,
+       "eval_accuracy": 0.16649079610739828,
+       "eval_f1": 0.07176290896776823,
+       "eval_loss": 3.3783769607543945,
+       "eval_runtime": 17.2721,
+       "eval_samples_per_second": 493.804,
+       "eval_steps_per_second": 0.984,
+       "step": 366
+     },
+     {
+       "epoch": 2.9959183673469387,
+       "grad_norm": 1.0882235765457153,
+       "learning_rate": 5e-05,
+       "loss": 1.9687,
+       "step": 549
+     },
+     {
+       "epoch": 2.9959183673469387,
+       "eval_accuracy": 0.41739946066361827,
+       "eval_f1": 0.23146127598121502,
+       "eval_loss": 2.4746670722961426,
+       "eval_runtime": 18.0262,
+       "eval_samples_per_second": 473.145,
+       "eval_steps_per_second": 0.943,
+       "step": 549
+     },
+     {
+       "epoch": 3.9959183673469387,
+       "grad_norm": 0.830756425857544,
+       "learning_rate": 4.983095894354858e-05,
+       "loss": 1.0019,
+       "step": 732
+     },
+     {
+       "epoch": 3.9959183673469387,
+       "eval_accuracy": 0.5312463360300153,
+       "eval_f1": 0.33343763170872565,
+       "eval_loss": 2.056602954864502,
+       "eval_runtime": 17.7176,
+       "eval_samples_per_second": 481.386,
+       "eval_steps_per_second": 0.959,
+       "step": 732
+     },
+     {
+       "epoch": 4.995918367346938,
+       "grad_norm": 1.341150164604187,
+       "learning_rate": 4.9326121764495596e-05,
+       "loss": 0.4955,
+       "step": 915
+     },
+     {
+       "epoch": 4.995918367346938,
+       "eval_accuracy": 0.5872904209168719,
+       "eval_f1": 0.3966908687854425,
+       "eval_loss": 2.070507526397705,
+       "eval_runtime": 17.7204,
+       "eval_samples_per_second": 481.309,
+       "eval_steps_per_second": 0.959,
+       "step": 915
+     },
+     {
+       "epoch": 5.995918367346938,
+       "grad_norm": 1.4914641380310059,
+       "learning_rate": 4.849231551964771e-05,
+       "loss": 0.3149,
+       "step": 1098
+     },
+     {
+       "epoch": 5.995918367346938,
+       "eval_accuracy": 0.608277640989565,
+       "eval_f1": 0.41221796485256534,
+       "eval_loss": 2.174699544906616,
+       "eval_runtime": 18.7633,
+       "eval_samples_per_second": 454.558,
+       "eval_steps_per_second": 0.906,
+       "step": 1098
+     },
+     {
+       "epoch": 6.995918367346938,
+       "grad_norm": 1.016514539718628,
+       "learning_rate": 4.734081600808531e-05,
+       "loss": 0.2324,
+       "step": 1281
+     },
+     {
+       "epoch": 6.995918367346938,
+       "eval_accuracy": 0.6051119709227342,
+       "eval_f1": 0.42029644401424293,
+       "eval_loss": 2.536925792694092,
+       "eval_runtime": 19.0396,
+       "eval_samples_per_second": 447.961,
+       "eval_steps_per_second": 0.893,
+       "step": 1281
+     },
+     {
+       "epoch": 7.995918367346938,
+       "grad_norm": 0.6603855490684509,
+       "learning_rate": 4.588719528532342e-05,
+       "loss": 0.1825,
+       "step": 1464
+     },
+     {
+       "epoch": 7.995918367346938,
+       "eval_accuracy": 0.5930355258529723,
+       "eval_f1": 0.37922494807809526,
+       "eval_loss": 2.6477608680725098,
+       "eval_runtime": 18.8796,
+       "eval_samples_per_second": 451.757,
+       "eval_steps_per_second": 0.9,
+       "step": 1464
+     },
+     {
+       "epoch": 8.995918367346938,
+       "grad_norm": 0.9515678286552429,
+       "learning_rate": 4.415111107797445e-05,
+       "loss": 0.1581,
+       "step": 1647
+     },
+     {
+       "epoch": 8.995918367346938,
+       "eval_accuracy": 0.5848282330871145,
+       "eval_f1": 0.3902253760074279,
+       "eval_loss": 2.7652101516723633,
+       "eval_runtime": 28.9433,
+       "eval_samples_per_second": 294.68,
+       "eval_steps_per_second": 0.587,
+       "step": 1647
+     },
+     {
+       "epoch": 9.995918367346938,
+       "grad_norm": 0.5628945827484131,
+       "learning_rate": 4.215604094671835e-05,
+       "loss": 0.1386,
+       "step": 1830
+     },
+     {
+       "epoch": 9.995918367346938,
+       "eval_accuracy": 0.6253957087583538,
+       "eval_f1": 0.4363306793570824,
+       "eval_loss": 2.5493264198303223,
+       "eval_runtime": 17.9843,
+       "eval_samples_per_second": 474.247,
+       "eval_steps_per_second": 0.945,
+       "step": 1830
+     },
+     {
+       "epoch": 10.995918367346938,
+       "grad_norm": 0.5759875178337097,
+       "learning_rate": 3.9928964792569655e-05,
+       "loss": 0.13,
+       "step": 2013
+     },
+     {
+       "epoch": 10.995918367346938,
+       "eval_accuracy": 0.6325477781686012,
+       "eval_f1": 0.42658322719917263,
+       "eval_loss": 2.668961763381958,
+       "eval_runtime": 17.9422,
+       "eval_samples_per_second": 475.359,
+       "eval_steps_per_second": 0.947,
+       "step": 2013
+     },
+     {
+       "epoch": 11.995918367346938,
+       "grad_norm": 0.7909059524536133,
+       "learning_rate": 3.7500000000000003e-05,
+       "loss": 0.1134,
+       "step": 2196
+     },
+     {
+       "epoch": 11.995918367346938,
+       "eval_accuracy": 0.5902215969046781,
+       "eval_f1": 0.40717895597633597,
+       "eval_loss": 2.847268581390381,
+       "eval_runtime": 18.1922,
+       "eval_samples_per_second": 468.828,
+       "eval_steps_per_second": 0.934,
+       "step": 2196
+     },
+     {
+       "epoch": 12.995918367346938,
+       "grad_norm": 0.6743366718292236,
+       "learning_rate": 3.490199415097892e-05,
+       "loss": 0.1078,
+       "step": 2379
+     },
+     {
+       "epoch": 12.995918367346938,
+       "eval_accuracy": 0.6048774768437097,
+       "eval_f1": 0.40486374255791757,
+       "eval_loss": 2.909079074859619,
+       "eval_runtime": 17.3197,
+       "eval_samples_per_second": 492.446,
+       "eval_steps_per_second": 0.982,
+       "step": 2379
+     },
+     {
+       "epoch": 13.995918367346938,
+       "grad_norm": 0.6435021758079529,
+       "learning_rate": 3.217008081777726e-05,
+       "loss": 0.0929,
+       "step": 2562
+     },
+     {
+       "epoch": 13.995918367346938,
+       "eval_accuracy": 0.6124985344120061,
+       "eval_f1": 0.402051577315403,
+       "eval_loss": 2.901214599609375,
+       "eval_runtime": 18.278,
+       "eval_samples_per_second": 466.625,
+       "eval_steps_per_second": 0.93,
+       "step": 2562
+     },
+     {
+       "epoch": 14.995918367346938,
+       "grad_norm": 0.7225833535194397,
+       "learning_rate": 2.9341204441673266e-05,
+       "loss": 0.0879,
+       "step": 2745
+     },
+     {
+       "epoch": 14.995918367346938,
+       "eval_accuracy": 0.5815453159807715,
+       "eval_f1": 0.3787146481538575,
+       "eval_loss": 2.927959442138672,
+       "eval_runtime": 19.3124,
+       "eval_samples_per_second": 441.634,
+       "eval_steps_per_second": 0.88,
+       "step": 2745
+     },
+     {
+       "epoch": 15.995918367346938,
+       "grad_norm": 0.519130527973175,
+       "learning_rate": 2.6453620722761896e-05,
+       "loss": 0.0875,
+       "step": 2928
+     },
+     {
+       "epoch": 15.995918367346938,
+       "eval_accuracy": 0.6116778051354204,
+       "eval_f1": 0.42421911178450894,
+       "eval_loss": 2.8714120388031006,
+       "eval_runtime": 18.6944,
+       "eval_samples_per_second": 456.233,
+       "eval_steps_per_second": 0.909,
+       "step": 2928
+     },
+     {
+       "epoch": 16.99591836734694,
+       "grad_norm": 0.5847667455673218,
+       "learning_rate": 2.3546379277238107e-05,
+       "loss": 0.083,
+       "step": 3111
+     },
+     {
+       "epoch": 16.99591836734694,
+       "eval_accuracy": 0.604994723883222,
+       "eval_f1": 0.40283444897722465,
+       "eval_loss": 2.9251325130462646,
+       "eval_runtime": 19.0241,
+       "eval_samples_per_second": 448.325,
+       "eval_steps_per_second": 0.894,
+       "step": 3111
+     },
+     {
+       "epoch": 17.99591836734694,
+       "grad_norm": 0.5335302948951721,
+       "learning_rate": 2.0658795558326743e-05,
+       "loss": 0.0743,
+       "step": 3294
+     },
+     {
+       "epoch": 17.99591836734694,
+       "eval_accuracy": 0.6085121350685895,
+       "eval_f1": 0.3982368535619314,
+       "eval_loss": 2.907853364944458,
+       "eval_runtime": 18.6799,
+       "eval_samples_per_second": 456.587,
+       "eval_steps_per_second": 0.91,
+       "step": 3294
+     },
+     {
+       "epoch": 18.99591836734694,
+       "grad_norm": 0.6082349419593811,
+       "learning_rate": 1.7829919182222752e-05,
+       "loss": 0.0743,
+       "step": 3477
+     },
+     {
+       "epoch": 18.99591836734694,
+       "eval_accuracy": 0.6140227459256654,
+       "eval_f1": 0.40722488778058297,
+       "eval_loss": 2.9568777084350586,
+       "eval_runtime": 18.2131,
+       "eval_samples_per_second": 468.288,
+       "eval_steps_per_second": 0.933,
+       "step": 3477
+     },
+     {
+       "epoch": 19.99591836734694,
+       "grad_norm": 0.5372836589813232,
+       "learning_rate": 1.5112603381728762e-05,
+       "loss": 0.0745,
+       "step": 3660
+     },
+     {
+       "epoch": 19.99591836734694,
+       "eval_accuracy": 0.6022980419744401,
+       "eval_f1": 0.3888247133789473,
+       "eval_loss": 3.133009910583496,
+       "eval_runtime": 19.5015,
+       "eval_samples_per_second": 437.351,
+       "eval_steps_per_second": 0.872,
+       "step": 3660
+     },
+     {
+       "epoch": 20.99591836734694,
+       "grad_norm": 0.4080846905708313,
+       "learning_rate": 1.2513768458995337e-05,
+       "loss": 0.0641,
+       "step": 3843
+     },
+     {
+       "epoch": 20.99591836734694,
+       "eval_accuracy": 0.6041739946066362,
+       "eval_f1": 0.4024604989707059,
+       "eval_loss": 3.086355447769165,
+       "eval_runtime": 18.9488,
+       "eval_samples_per_second": 450.109,
+       "eval_steps_per_second": 0.897,
+       "step": 3843
+     },
+     {
+       "epoch": 21.99591836734694,
+       "grad_norm": 0.6301392316818237,
+       "learning_rate": 1.0083788397924998e-05,
+       "loss": 0.0611,
+       "step": 4026
+     },
+     {
+       "epoch": 21.99591836734694,
+       "eval_accuracy": 0.611560558095908,
+       "eval_f1": 0.4250797125355288,
+       "eval_loss": 3.1089813709259033,
+       "eval_runtime": 19.3666,
+       "eval_samples_per_second": 440.398,
+       "eval_steps_per_second": 0.878,
+       "step": 4026
+     },
+     {
+       "epoch": 22.99591836734694,
+       "grad_norm": 0.7403397560119629,
+       "learning_rate": 7.855524510252082e-06,
+       "loss": 0.0618,
+       "step": 4209
+     },
+     {
+       "epoch": 22.99591836734694,
+       "eval_accuracy": 0.6095673584241997,
+       "eval_f1": 0.38478101379896623,
+       "eval_loss": 3.165566921234131,
+       "eval_runtime": 18.268,
+       "eval_samples_per_second": 466.882,
+       "eval_steps_per_second": 0.931,
+       "step": 4209
+     },
+     {
+       "epoch": 23.99591836734694,
+       "grad_norm": 0.6018996238708496,
+       "learning_rate": 5.8591102425065766e-06,
+       "loss": 0.0595,
+       "step": 4392
+     },
+     {
+       "epoch": 23.99591836734694,
+       "eval_accuracy": 0.6026497830929769,
+       "eval_f1": 0.4033953887201948,
+       "eval_loss": 3.182464122772217,
+       "eval_runtime": 18.8509,
+       "eval_samples_per_second": 452.446,
+       "eval_steps_per_second": 0.902,
+       "step": 4392
+     },
+     {
+       "epoch": 24.99591836734694,
+       "grad_norm": 0.7152003049850464,
+       "learning_rate": 4.1215436728432114e-06,
+       "loss": 0.0549,
+       "step": 4575
+     },
+     {
+       "epoch": 24.99591836734694,
+       "eval_accuracy": 0.6062844413178567,
+       "eval_f1": 0.3998774411315016,
+       "eval_loss": 3.2211174964904785,
+       "eval_runtime": 18.4161,
+       "eval_samples_per_second": 463.128,
+       "eval_steps_per_second": 0.923,
+       "step": 4575
+     },
+     {
+       "epoch": 25.99591836734694,
+       "grad_norm": 0.655457615852356,
+       "learning_rate": 2.6663224083492645e-06,
+       "loss": 0.0578,
+       "step": 4758
+     },
+     {
+       "epoch": 25.99591836734694,
+       "eval_accuracy": 0.6093328643451753,
+       "eval_f1": 0.40241682477511076,
+       "eval_loss": 3.154259204864502,
+       "eval_runtime": 19.0328,
+       "eval_samples_per_second": 448.122,
+       "eval_steps_per_second": 0.893,
+       "step": 4758
+     },
+     {
+       "epoch": 26.99591836734694,
+       "grad_norm": 0.8799217939376831,
+       "learning_rate": 1.5131258202183586e-06,
+       "loss": 0.0531,
+       "step": 4941
+     },
+     {
+       "epoch": 26.99591836734694,
+       "eval_accuracy": 0.611560558095908,
+       "eval_f1": 0.4136571965633068,
+       "eval_loss": 3.1584064960479736,
+       "eval_runtime": 19.4229,
+       "eval_samples_per_second": 439.121,
+       "eval_steps_per_second": 0.875,
+       "step": 4941
+     },
+     {
+       "epoch": 27.99591836734694,
+       "grad_norm": 0.5971439480781555,
+       "learning_rate": 6.775489140148194e-07,
+       "loss": 0.0556,
+       "step": 5124
+     },
+     {
+       "epoch": 27.99591836734694,
+       "eval_accuracy": 0.6054637120412709,
+       "eval_f1": 0.4107652565512037,
+       "eval_loss": 3.177584171295166,
+       "eval_runtime": 18.7393,
+       "eval_samples_per_second": 455.14,
+       "eval_steps_per_second": 0.907,
+       "step": 5124
+     },
+     {
+       "epoch": 28.99591836734694,
+       "grad_norm": 0.5378488898277283,
+       "learning_rate": 1.7089143397631958e-07,
+       "loss": 0.0592,
+       "step": 5307
+     },
+     {
+       "epoch": 28.99591836734694,
+       "eval_accuracy": 0.604994723883222,
+       "eval_f1": 0.41074234435939105,
+       "eval_loss": 3.1705150604248047,
+       "eval_runtime": 19.1621,
+       "eval_samples_per_second": 445.096,
+       "eval_steps_per_second": 0.887,
+       "step": 5307
+     },
+     {
+       "epoch": 29.99591836734694,
+       "grad_norm": 0.7799643278121948,
+       "learning_rate": 5.053357646223056e-12,
+       "loss": 0.0511,
+       "step": 5490
+     },
+     {
+       "epoch": 29.99591836734694,
+       "eval_accuracy": 0.6051119709227342,
+       "eval_f1": 0.41072097568738997,
+       "eval_loss": 3.1688835620880127,
+       "eval_runtime": 18.8369,
+       "eval_samples_per_second": 452.78,
+       "eval_steps_per_second": 0.902,
+       "step": 5490
+     },
+     {
+       "epoch": 29.99591836734694,
+       "step": 5490,
+       "total_flos": 5.117922821239409e+20,
+       "train_loss": 0.060013725892225034,
+       "train_runtime": 5236.9953,
+       "train_samples_per_second": 2153.277,
+       "train_steps_per_second": 1.048
+     }
+   ],
+   "logging_steps": 500,
+   "max_steps": 5490,
+   "num_input_tokens_seen": 0,
+   "num_train_epochs": 30,
+   "save_steps": 500,
+   "stateful_callbacks": {
+     "TrainerControl": {
+       "args": {
+         "should_epoch_stop": false,
+         "should_evaluate": false,
+         "should_log": false,
+         "should_save": true,
+         "should_training_stop": true
+       },
+       "attributes": {}
+     }
+   },
+   "total_flos": 5.117922821239409e+20,
+   "train_batch_size": 128,
+   "trial_name": null,
+   "trial_params": null
+ }
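
The `log_history` above pairs one training entry and one evaluation entry per epoch, and `best_metric` corresponds to the evaluation F1 at the `best_model_checkpoint` step. A minimal sketch (assuming `trainer_state.json` has been downloaded to the working directory) to pull out the evaluation curve:

```python
import json

with open("trainer_state.json") as f:
    state = json.load(f)

# Keep only the evaluation entries; training entries have no eval_accuracy
evals = [e for e in state["log_history"] if "eval_accuracy" in e]

for e in evals:
    print(f"step {e['step']:>4}: accuracy={e['eval_accuracy']:.4f}  f1={e['eval_f1']:.4f}")

best = max(evals, key=lambda e: e["eval_f1"])
print("best eval_f1:", best["eval_f1"], "at step", best["step"])  # matches best_metric (step 1830)
```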