update meralion api
Browse files- model_information.py +7 -3
- results_organized/wer/asr_english.csv +2 -1
- results_organized/wer/asr_indonesian.csv +2 -1
- results_organized/wer/asr_malay.csv +2 -1
- results_organized/wer/asr_mandarin.csv +2 -1
- results_organized/wer/asr_private.csv +2 -1
- results_organized/wer/asr_singlish.csv +2 -1
- results_organized/wer/asr_tamil.csv +2 -1
- results_organized/wer/asr_thai.csv +2 -1
- results_organized/wer/asr_vietnamese.csv +2 -1
model_information.py
CHANGED
|
@@ -12,6 +12,10 @@ data['Original Name'].append('Omnilingual-ASR-7B')
|
|
| 12 |
data['Proper Display Name'].append('Fusion: Omnilingual-LLM-ASR-7B')
|
| 13 |
data['Link'].append('https://arxiv.org/abs/2511.09690')
|
| 14 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 15 |
data['Original Name'].append('SALMONN_7B')
|
| 16 |
data['Proper Display Name'].append('Fusion: SALMONN-7B')
|
| 17 |
data['Link'].append('https://arxiv.org/html/2310.13289v2')
|
|
@@ -42,15 +46,15 @@ data['Link'].append('https://huggingface.co/MERaLiON/MERaLiON-AudioLLM-Whisper-S
|
|
| 42 |
|
| 43 |
data['Original Name'].append('MERaLiON-AudioLLM-v2-2b')
|
| 44 |
data['Proper Display Name'].append('Fusion: MERaLiON-2-3B')
|
| 45 |
-
data['Link'].append('https://huggingface.co/MERaLiON/MERaLiON-
|
| 46 |
|
| 47 |
data['Original Name'].append('MERaLiON-AudioLLM-v2-9b')
|
| 48 |
data['Proper Display Name'].append('Fusion: MERaLiON-2-10B')
|
| 49 |
-
data['Link'].append('https://huggingface.co/MERaLiON/MERaLiON-
|
| 50 |
|
| 51 |
data['Original Name'].append('MERaLiON-AudioLLM-v2-9b-asr')
|
| 52 |
data['Proper Display Name'].append('Fusion: MERaLiON-2-10B-ASR')
|
| 53 |
-
data['Link'].append('https://huggingface.co/MERaLiON/MERaLiON-
|
| 54 |
|
| 55 |
data['Original Name'].append('MERaLiON-SpeechEncoder2-ASR-CTC')
|
| 56 |
data['Proper Display Name'].append('Fusion: MERaLiON-SpeechEncoder2-ASR-CTC')
|
|
|
|
| 12 |
data['Proper Display Name'].append('Fusion: Omnilingual-LLM-ASR-7B')
|
| 13 |
data['Link'].append('https://arxiv.org/abs/2511.09690')
|
| 14 |
|
| 15 |
+
data['Original Name'].append('MERaLiON-ASR-dev-1215')
|
| 16 |
+
data['Proper Display Name'].append('🌟 API: MERaLiON-ASR-dev-1215')
|
| 17 |
+
data['Link'].append("")
|
| 18 |
+
|
| 19 |
data['Original Name'].append('SALMONN_7B')
|
| 20 |
data['Proper Display Name'].append('Fusion: SALMONN-7B')
|
| 21 |
data['Link'].append('https://arxiv.org/html/2310.13289v2')
|
|
|
|
| 46 |
|
| 47 |
data['Original Name'].append('MERaLiON-AudioLLM-v2-2b')
|
| 48 |
data['Proper Display Name'].append('Fusion: MERaLiON-2-3B')
|
| 49 |
+
data['Link'].append('https://huggingface.co/MERaLiON/MERaLiON-2-3B')
|
| 50 |
|
| 51 |
data['Original Name'].append('MERaLiON-AudioLLM-v2-9b')
|
| 52 |
data['Proper Display Name'].append('Fusion: MERaLiON-2-10B')
|
| 53 |
+
data['Link'].append('https://huggingface.co/MERaLiON/MERaLiON-2-10B')
|
| 54 |
|
| 55 |
data['Original Name'].append('MERaLiON-AudioLLM-v2-9b-asr')
|
| 56 |
data['Proper Display Name'].append('Fusion: MERaLiON-2-10B-ASR')
|
| 57 |
+
data['Link'].append('https://huggingface.co/MERaLiON/MERaLiON-2-10B-ASR')
|
| 58 |
|
| 59 |
data['Original Name'].append('MERaLiON-SpeechEncoder2-ASR-CTC')
|
| 60 |
data['Proper Display Name'].append('Fusion: MERaLiON-SpeechEncoder2-ASR-CTC')
|
results_organized/wer/asr_english.csv
CHANGED
|
@@ -19,4 +19,5 @@ phi_4_multimodal_instruct,0.0168446070849209,0.0385117370003972,0.07948914070484
|
|
| 19 |
whisper_large_v3,0.0189383936318708,0.0363175515917301,0.0981932241083422,0.1455769221247146,0.0959389704905374,0.1078364887549888,0.1409171231397644,0.0382882083673397,0.045559297996809
|
| 20 |
MERaLiON-SpeechEncoder2-ASR-CTC,0.0412,0.0623,0.1248,0.2095,0.1334,0.153,0.1682,0.0421999999999999,0.044
|
| 21 |
Omnilingual-ASR-7B,0.0300218752357245,0.0559032044616693,0.1274849641078704,0.9775582765878016,0.8353292063587463,0.515911215279231,0.5435311281558622,1.128111996614712,0.9943988445415156
|
| 22 |
-
Fusion: Omnilingual-LLM-ASR-7B[with language code],0.
|
|
|
|
|
|
| 19 |
whisper_large_v3,0.0189383936318708,0.0363175515917301,0.0981932241083422,0.1455769221247146,0.0959389704905374,0.1078364887549888,0.1409171231397644,0.0382882083673397,0.045559297996809
|
| 20 |
MERaLiON-SpeechEncoder2-ASR-CTC,0.0412,0.0623,0.1248,0.2095,0.1334,0.153,0.1682,0.0421999999999999,0.044
|
| 21 |
Omnilingual-ASR-7B,0.0300218752357245,0.0559032044616693,0.1274849641078704,0.9775582765878016,0.8353292063587463,0.515911215279231,0.5435311281558622,1.128111996614712,0.9943988445415156
|
| 22 |
+
Fusion: Omnilingual-LLM-ASR-7B[with language code],0.0271931809610017,0.0493241327157576,0.1246006596391385,0.2870196328399719,0.1640247017459506,0.2035017229593047,0.2580305229955792,0.1014881162282248,0.1441857188149505
|
| 23 |
+
MERaLiON-ASR-dev-1215,0.02039084015543064,0.03707416724989124,0.07147768973207114,0.19285698959693273,0.08599886183875714,0.08238096296872742,0.12177009165959526,0.02913310386430574,0.02903740471547598
|
results_organized/wer/asr_indonesian.csv
CHANGED
|
@@ -14,4 +14,5 @@ phi_4_multimodal_instruct,1.327169012788665,5.803850364012302
|
|
| 14 |
whisper_large_v3,0.0781580642193394,0.1960453842545132
|
| 15 |
MERaLiON-SpeechEncoder2-ASR-CTC,0.0559,0.1662
|
| 16 |
Omnilingual-ASR-7B,0.1532246831034963,0.2589953312037069
|
| 17 |
-
Fusion: Omnilingual-LLM-ASR-7B[with language code],0.
|
|
|
|
|
|
| 14 |
whisper_large_v3,0.0781580642193394,0.1960453842545132
|
| 15 |
MERaLiON-SpeechEncoder2-ASR-CTC,0.0559,0.1662
|
| 16 |
Omnilingual-ASR-7B,0.1532246831034963,0.2589953312037069
|
| 17 |
+
Fusion: Omnilingual-LLM-ASR-7B[with language code],0.1189116404327436,0.2440411415733492
|
| 18 |
+
MERaLiON-ASR-dev-1215,0.06941760971570522,0.15281566556043993
|
results_organized/wer/asr_malay.csv
CHANGED
|
@@ -14,4 +14,5 @@ phi_4_multimodal_instruct,3.762932736606555
|
|
| 14 |
whisper_large_v3,0.2196919836777675
|
| 15 |
MERaLiON-SpeechEncoder2-ASR-CTC,0.1559
|
| 16 |
Omnilingual-ASR-7B,0.3238279808047249
|
| 17 |
-
Fusion: Omnilingual-LLM-ASR-7B[with language code],0.
|
|
|
|
|
|
| 14 |
whisper_large_v3,0.2196919836777675
|
| 15 |
MERaLiON-SpeechEncoder2-ASR-CTC,0.1559
|
| 16 |
Omnilingual-ASR-7B,0.3238279808047249
|
| 17 |
+
Fusion: Omnilingual-LLM-ASR-7B[with language code],0.292266519010705
|
| 18 |
+
MERaLiON-ASR-dev-1215,0.1668641130270721
|
results_organized/wer/asr_mandarin.csv
CHANGED
|
@@ -19,4 +19,5 @@ phi_4_multimodal_instruct,0.1223297895507909,0.154221316286565,0.440084790673025
|
|
| 19 |
whisper_large_v3,0.1245471283482805,0.1975710489525415,0.190821409644939
|
| 20 |
MERaLiON-SpeechEncoder2-ASR-CTC,0.0747,0.1651,0.1769
|
| 21 |
Omnilingual-ASR-7B,0.0896792945465293,0.1433522201788049,0.2534749710035532
|
| 22 |
-
Fusion: Omnilingual-LLM-ASR-7B[with language code],0.
|
|
|
|
|
|
| 19 |
whisper_large_v3,0.1245471283482805,0.1975710489525415,0.190821409644939
|
| 20 |
MERaLiON-SpeechEncoder2-ASR-CTC,0.0747,0.1651,0.1769
|
| 21 |
Omnilingual-ASR-7B,0.0896792945465293,0.1433522201788049,0.2534749710035532
|
| 22 |
+
Fusion: Omnilingual-LLM-ASR-7B[with language code],0.076713138578255,0.1254929891887869,0.2504740688918754
|
| 23 |
+
MERaLiON-ASR-dev-1215,0.04177307913127833,0.10956959755824253,0.14183359830418654
|
results_organized/wer/asr_private.csv
CHANGED
|
@@ -14,4 +14,5 @@ phi_4_multimodal_instruct,0.1908042294136494,0.5388096066829099,0.26073567151411
|
|
| 14 |
whisper_large_v3,0.1416212752322973,0.1879568395405499,0.1654405474764756,0.1163705869125253,0.1128716105847762,0.0670829785220929,0.0697674418604651,0.106860259660444,0.0816953184128013
|
| 15 |
MERaLiON-SpeechEncoder2-ASR-CTC,0.1628,0.1753,0.1855,0.1176,0.1052,0.0616,0.0803999999999999,0.1152,0.1192
|
| 16 |
Omnilingual-ASR-7B,1.0476568285200465,1.006522122333862,0.9160827209024098,1.033498201438849,0.9437056375948436,0.8528543878807593,0.9335548172757476,0.8400923927448976,0.7837808598567627
|
| 17 |
-
Fusion: Omnilingual-LLM-ASR-7B[with language code],0.
|
|
|
|
|
|
| 14 |
whisper_large_v3,0.1416212752322973,0.1879568395405499,0.1654405474764756,0.1163705869125253,0.1128716105847762,0.0670829785220929,0.0697674418604651,0.106860259660444,0.0816953184128013
|
| 15 |
MERaLiON-SpeechEncoder2-ASR-CTC,0.1628,0.1753,0.1855,0.1176,0.1052,0.0616,0.0803999999999999,0.1152,0.1192
|
| 16 |
Omnilingual-ASR-7B,1.0476568285200465,1.006522122333862,0.9160827209024098,1.033498201438849,0.9437056375948436,0.8528543878807593,0.9335548172757476,0.8400923927448976,0.7837808598567627
|
| 17 |
+
Fusion: Omnilingual-LLM-ASR-7B[with language code],0.2740399873056172,0.317644985016746,0.2775593915569988,0.2366232014388489,0.2033123929183324,0.1723088361718441,0.2139310911194893,0.8400923927448976,0.7837808598567627
|
| 18 |
+
MERaLiON-ASR-dev-1215,0.12277047954715369,0.14096762965541246,0.17005988023952096,0.11378457387002473,0.09931394968964391,0.0442331346390387,0.05399886557005105,0.08873012214796036,0.10024867553249
|
results_organized/wer/asr_singlish.csv
CHANGED
|
@@ -19,4 +19,5 @@ phi_4_multimodal_instruct,0.0576158778923755,0.3451018586153721,0.43818394113014
|
|
| 19 |
whisper_large_v3,0.0691975715017189,0.319251684116549,0.2671952643440953,0.4567139031045279,0.2108972581751324,0.1704161888919394
|
| 20 |
MERaLiON-SpeechEncoder2-ASR-CTC,0.0486,0.0511,0.1856,0.2678,0.1363,0.0968
|
| 21 |
Omnilingual-ASR-7B,0.1816984858459512,0.4328902788636956,0.975503383060243,0.8850665821179454,0.9044736152749075,0.8963283965903138
|
| 22 |
-
Fusion: Omnilingual-LLM-ASR-7B[with language code],0.
|
|
|
|
|
|
| 19 |
whisper_large_v3,0.0691975715017189,0.319251684116549,0.2671952643440953,0.4567139031045279,0.2108972581751324,0.1704161888919394
|
| 20 |
MERaLiON-SpeechEncoder2-ASR-CTC,0.0486,0.0511,0.1856,0.2678,0.1363,0.0968
|
| 21 |
Omnilingual-ASR-7B,0.1816984858459512,0.4328902788636956,0.975503383060243,0.8850665821179454,0.9044736152749075,0.8963283965903138
|
| 22 |
+
Fusion: Omnilingual-LLM-ASR-7B[with language code],0.1816984858459512,0.4328902788636956,0.975503383060243,0.8850665821179454,0.9044736152749075,0.8963283965903138
|
| 23 |
+
MERaLiON-ASR-dev-1215,0.04330334284251335,0.05137570002434867,0.18361528226572896,0.23871795194205886,0.13380805766733303,0.0957702805277863
|
results_organized/wer/asr_tamil.csv
CHANGED
|
@@ -14,4 +14,5 @@ phi_4_multimodal_instruct,1.1784589191228196,1.7016514406184118,2.75005672425529
|
|
| 14 |
whisper_large_v3,0.2448438631011245,0.2314476458186929,0.8481572720495284
|
| 15 |
MERaLiON-SpeechEncoder2-ASR-CTC,0.1442,0.1632,0.6578
|
| 16 |
Omnilingual-ASR-7B,0.3144055763521363,0.1062680115273775,0.867817443980474
|
| 17 |
-
Fusion: Omnilingual-LLM-ASR-7B[with language code],0.3144055763521363,0.
|
|
|
|
|
|
| 14 |
whisper_large_v3,0.2448438631011245,0.2314476458186929,0.8481572720495284
|
| 15 |
MERaLiON-SpeechEncoder2-ASR-CTC,0.1442,0.1632,0.6578
|
| 16 |
Omnilingual-ASR-7B,0.3144055763521363,0.1062680115273775,0.867817443980474
|
| 17 |
+
Fusion: Omnilingual-LLM-ASR-7B[with language code],0.3144055763521363,0.1062680115273775,0.8675527848026818
|
| 18 |
+
MERaLiON-ASR-dev-1215,0.12422135451181095,0.13475052705551652,0.49745551197692134
|
results_organized/wer/asr_thai.csv
CHANGED
|
@@ -14,4 +14,5 @@ phi_4_multimodal_instruct,1.7344522925894887,1.2856834920064666
|
|
| 14 |
whisper_large_v3,0.2139446905303483,0.0282019040776001
|
| 15 |
MERaLiON-SpeechEncoder2-ASR-CTC,0.1669999999999999,0.0137
|
| 16 |
Omnilingual-ASR-7B,0.2754222795926698,0.4428487279459202
|
| 17 |
-
Fusion: Omnilingual-LLM-ASR-7B[with language code],0.
|
|
|
|
|
|
| 14 |
whisper_large_v3,0.2139446905303483,0.0282019040776001
|
| 15 |
MERaLiON-SpeechEncoder2-ASR-CTC,0.1669999999999999,0.0137
|
| 16 |
Omnilingual-ASR-7B,0.2754222795926698,0.4428487279459202
|
| 17 |
+
Fusion: Omnilingual-LLM-ASR-7B[with language code],0.1880426747867915,0.0330706011051583
|
| 18 |
+
MERaLiON-ASR-dev-1215,0.15903747156710163,0.009951499910185018
|
results_organized/wer/asr_vietnamese.csv
CHANGED
|
@@ -14,4 +14,5 @@ phi_4_multimodal_instruct,1.1070294304467498,2.5042567310800923
|
|
| 14 |
whisper_large_v3,0.1366716070294304,0.1602754255313115
|
| 15 |
MERaLiON-SpeechEncoder2-ASR-CTC,0.1987999999999999,0.1322
|
| 16 |
Omnilingual-ASR-7B,0.1417272338606242,0.1516119663084519
|
| 17 |
-
Fusion: Omnilingual-LLM-ASR-7B[with language code],0.
|
|
|
|
|
|
| 14 |
whisper_large_v3,0.1366716070294304,0.1602754255313115
|
| 15 |
MERaLiON-SpeechEncoder2-ASR-CTC,0.1987999999999999,0.1322
|
| 16 |
Omnilingual-ASR-7B,0.1417272338606242,0.1516119663084519
|
| 17 |
+
Fusion: Omnilingual-LLM-ASR-7B[with language code],0.1260153911928174,0.1467789718268951
|
| 18 |
+
MERaLiON-ASR-dev-1215,0.12428541181452467,0.07845317028625878
|