YingxuHe committed on
Commit
1f2ebc8
·
1 Parent(s): b812428

update meralion api

Browse files
model_information.py CHANGED
@@ -12,6 +12,10 @@ data['Original Name'].append('Omnilingual-ASR-7B')
12
  data['Proper Display Name'].append('Fusion: Omnilingual-LLM-ASR-7B')
13
  data['Link'].append('https://arxiv.org/abs/2511.09690')
14
 
 
 
 
 
15
  data['Original Name'].append('SALMONN_7B')
16
  data['Proper Display Name'].append('Fusion: SALMONN-7B')
17
  data['Link'].append('https://arxiv.org/html/2310.13289v2')
@@ -42,15 +46,15 @@ data['Link'].append('https://huggingface.co/MERaLiON/MERaLiON-AudioLLM-Whisper-S
42
 
43
  data['Original Name'].append('MERaLiON-AudioLLM-v2-2b')
44
  data['Proper Display Name'].append('Fusion: MERaLiON-2-3B')
45
- data['Link'].append('https://huggingface.co/MERaLiON/MERaLiON-AudioLLM-Whisper-SEA-LION')
46
 
47
  data['Original Name'].append('MERaLiON-AudioLLM-v2-9b')
48
  data['Proper Display Name'].append('Fusion: MERaLiON-2-10B')
49
- data['Link'].append('https://huggingface.co/MERaLiON/MERaLiON-AudioLLM-Whisper-SEA-LION')
50
 
51
  data['Original Name'].append('MERaLiON-AudioLLM-v2-9b-asr')
52
  data['Proper Display Name'].append('Fusion: MERaLiON-2-10B-ASR')
53
- data['Link'].append('https://huggingface.co/MERaLiON/MERaLiON-AudioLLM-Whisper-SEA-LION')
54
 
55
  data['Original Name'].append('MERaLiON-SpeechEncoder2-ASR-CTC')
56
  data['Proper Display Name'].append('Fusion: MERaLiON-SpeechEncoder2-ASR-CTC')
 
12
  data['Proper Display Name'].append('Fusion: Omnilingual-LLM-ASR-7B')
13
  data['Link'].append('https://arxiv.org/abs/2511.09690')
14
 
15
+ data['Original Name'].append('MERaLiON-ASR-dev-1215')
16
+ data['Proper Display Name'].append('🌟 API: MERaLiON-ASR-dev-1215')
17
+ data['Link'].append("")
18
+
19
  data['Original Name'].append('SALMONN_7B')
20
  data['Proper Display Name'].append('Fusion: SALMONN-7B')
21
  data['Link'].append('https://arxiv.org/html/2310.13289v2')
 
46
 
47
  data['Original Name'].append('MERaLiON-AudioLLM-v2-2b')
48
  data['Proper Display Name'].append('Fusion: MERaLiON-2-3B')
49
+ data['Link'].append('https://huggingface.co/MERaLiON/MERaLiON-2-3B')
50
 
51
  data['Original Name'].append('MERaLiON-AudioLLM-v2-9b')
52
  data['Proper Display Name'].append('Fusion: MERaLiON-2-10B')
53
+ data['Link'].append('https://huggingface.co/MERaLiON/MERaLiON-2-10B')
54
 
55
  data['Original Name'].append('MERaLiON-AudioLLM-v2-9b-asr')
56
  data['Proper Display Name'].append('Fusion: MERaLiON-2-10B-ASR')
57
+ data['Link'].append('https://huggingface.co/MERaLiON/MERaLiON-2-10B-ASR')
58
 
59
  data['Original Name'].append('MERaLiON-SpeechEncoder2-ASR-CTC')
60
  data['Proper Display Name'].append('Fusion: MERaLiON-SpeechEncoder2-ASR-CTC')
results_organized/wer/asr_english.csv CHANGED
@@ -19,4 +19,5 @@ phi_4_multimodal_instruct,0.0168446070849209,0.0385117370003972,0.07948914070484
19
  whisper_large_v3,0.0189383936318708,0.0363175515917301,0.0981932241083422,0.1455769221247146,0.0959389704905374,0.1078364887549888,0.1409171231397644,0.0382882083673397,0.045559297996809
20
  MERaLiON-SpeechEncoder2-ASR-CTC,0.0412,0.0623,0.1248,0.2095,0.1334,0.153,0.1682,0.0421999999999999,0.044
21
  Omnilingual-ASR-7B,0.0300218752357245,0.0559032044616693,0.1274849641078704,0.9775582765878016,0.8353292063587463,0.515911215279231,0.5435311281558622,1.128111996614712,0.9943988445415156
22
- Fusion: Omnilingual-LLM-ASR-7B[with language code],0.027193180961001734,0.04932413271575763,0.12460065963913859,0.2870196328399719,0.16402470174595066,0.2035017229593047,0.2580305229955792,0.10148811622822485,0.14418571881495051
 
 
19
  whisper_large_v3,0.0189383936318708,0.0363175515917301,0.0981932241083422,0.1455769221247146,0.0959389704905374,0.1078364887549888,0.1409171231397644,0.0382882083673397,0.045559297996809
20
  MERaLiON-SpeechEncoder2-ASR-CTC,0.0412,0.0623,0.1248,0.2095,0.1334,0.153,0.1682,0.0421999999999999,0.044
21
  Omnilingual-ASR-7B,0.0300218752357245,0.0559032044616693,0.1274849641078704,0.9775582765878016,0.8353292063587463,0.515911215279231,0.5435311281558622,1.128111996614712,0.9943988445415156
22
+ Fusion: Omnilingual-LLM-ASR-7B[with language code],0.0271931809610017,0.0493241327157576,0.1246006596391385,0.2870196328399719,0.1640247017459506,0.2035017229593047,0.2580305229955792,0.1014881162282248,0.1441857188149505
23
+ MERaLiON-ASR-dev-1215,0.02039084015543064,0.03707416724989124,0.07147768973207114,0.19285698959693273,0.08599886183875714,0.08238096296872742,0.12177009165959526,0.02913310386430574,0.02903740471547598
results_organized/wer/asr_indonesian.csv CHANGED
@@ -14,4 +14,5 @@ phi_4_multimodal_instruct,1.327169012788665,5.803850364012302
14
  whisper_large_v3,0.0781580642193394,0.1960453842545132
15
  MERaLiON-SpeechEncoder2-ASR-CTC,0.0559,0.1662
16
  Omnilingual-ASR-7B,0.1532246831034963,0.2589953312037069
17
- Fusion: Omnilingual-LLM-ASR-7B[with language code],0.11891164043274365,0.24404114157334925
 
 
14
  whisper_large_v3,0.0781580642193394,0.1960453842545132
15
  MERaLiON-SpeechEncoder2-ASR-CTC,0.0559,0.1662
16
  Omnilingual-ASR-7B,0.1532246831034963,0.2589953312037069
17
+ Fusion: Omnilingual-LLM-ASR-7B[with language code],0.1189116404327436,0.2440411415733492
18
+ MERaLiON-ASR-dev-1215,0.06941760971570522,0.15281566556043993
results_organized/wer/asr_malay.csv CHANGED
@@ -14,4 +14,5 @@ phi_4_multimodal_instruct,3.762932736606555
14
  whisper_large_v3,0.2196919836777675
15
  MERaLiON-SpeechEncoder2-ASR-CTC,0.1559
16
  Omnilingual-ASR-7B,0.3238279808047249
17
- Fusion: Omnilingual-LLM-ASR-7B[with language code],0.29226651901070505
 
 
14
  whisper_large_v3,0.2196919836777675
15
  MERaLiON-SpeechEncoder2-ASR-CTC,0.1559
16
  Omnilingual-ASR-7B,0.3238279808047249
17
+ Fusion: Omnilingual-LLM-ASR-7B[with language code],0.292266519010705
18
+ MERaLiON-ASR-dev-1215,0.1668641130270721
results_organized/wer/asr_mandarin.csv CHANGED
@@ -19,4 +19,5 @@ phi_4_multimodal_instruct,0.1223297895507909,0.154221316286565,0.440084790673025
19
  whisper_large_v3,0.1245471283482805,0.1975710489525415,0.190821409644939
20
  MERaLiON-SpeechEncoder2-ASR-CTC,0.0747,0.1651,0.1769
21
  Omnilingual-ASR-7B,0.0896792945465293,0.1433522201788049,0.2534749710035532
22
- Fusion: Omnilingual-LLM-ASR-7B[with language code],0.07671313857825508,0.12549298918878696,0.25047406889187546
 
 
19
  whisper_large_v3,0.1245471283482805,0.1975710489525415,0.190821409644939
20
  MERaLiON-SpeechEncoder2-ASR-CTC,0.0747,0.1651,0.1769
21
  Omnilingual-ASR-7B,0.0896792945465293,0.1433522201788049,0.2534749710035532
22
+ Fusion: Omnilingual-LLM-ASR-7B[with language code],0.076713138578255,0.1254929891887869,0.2504740688918754
23
+ MERaLiON-ASR-dev-1215,0.04177307913127833,0.10956959755824253,0.14183359830418654
results_organized/wer/asr_private.csv CHANGED
@@ -14,4 +14,5 @@ phi_4_multimodal_instruct,0.1908042294136494,0.5388096066829099,0.26073567151411
14
  whisper_large_v3,0.1416212752322973,0.1879568395405499,0.1654405474764756,0.1163705869125253,0.1128716105847762,0.0670829785220929,0.0697674418604651,0.106860259660444,0.0816953184128013
15
  MERaLiON-SpeechEncoder2-ASR-CTC,0.1628,0.1753,0.1855,0.1176,0.1052,0.0616,0.0803999999999999,0.1152,0.1192
16
  Omnilingual-ASR-7B,1.0476568285200465,1.006522122333862,0.9160827209024098,1.033498201438849,0.9437056375948436,0.8528543878807593,0.9335548172757476,0.8400923927448976,0.7837808598567627
17
- Fusion: Omnilingual-LLM-ASR-7B[with language code],0.27403998730561724,0.317644985016746,0.2775593915569988,0.23662320143884893,0.2033123929183324,0.17230883617184414,0.21393109111948935,0.8400923927448976,0.7837808598567627
 
 
14
  whisper_large_v3,0.1416212752322973,0.1879568395405499,0.1654405474764756,0.1163705869125253,0.1128716105847762,0.0670829785220929,0.0697674418604651,0.106860259660444,0.0816953184128013
15
  MERaLiON-SpeechEncoder2-ASR-CTC,0.1628,0.1753,0.1855,0.1176,0.1052,0.0616,0.0803999999999999,0.1152,0.1192
16
  Omnilingual-ASR-7B,1.0476568285200465,1.006522122333862,0.9160827209024098,1.033498201438849,0.9437056375948436,0.8528543878807593,0.9335548172757476,0.8400923927448976,0.7837808598567627
17
+ Fusion: Omnilingual-LLM-ASR-7B[with language code],0.2740399873056172,0.317644985016746,0.2775593915569988,0.2366232014388489,0.2033123929183324,0.1723088361718441,0.2139310911194893,0.8400923927448976,0.7837808598567627
18
+ MERaLiON-ASR-dev-1215,0.12277047954715369,0.14096762965541246,0.17005988023952096,0.11378457387002473,0.09931394968964391,0.0442331346390387,0.05399886557005105,0.08873012214796036,0.10024867553249
results_organized/wer/asr_singlish.csv CHANGED
@@ -19,4 +19,5 @@ phi_4_multimodal_instruct,0.0576158778923755,0.3451018586153721,0.43818394113014
19
  whisper_large_v3,0.0691975715017189,0.319251684116549,0.2671952643440953,0.4567139031045279,0.2108972581751324,0.1704161888919394
20
  MERaLiON-SpeechEncoder2-ASR-CTC,0.0486,0.0511,0.1856,0.2678,0.1363,0.0968
21
  Omnilingual-ASR-7B,0.1816984858459512,0.4328902788636956,0.975503383060243,0.8850665821179454,0.9044736152749075,0.8963283965903138
22
- Fusion: Omnilingual-LLM-ASR-7B[with language code],0.18169848584595127,0.4328902788636956,0.975503383060243,0.8850665821179454,0.9044736152749075,0.8963283965903138
 
 
19
  whisper_large_v3,0.0691975715017189,0.319251684116549,0.2671952643440953,0.4567139031045279,0.2108972581751324,0.1704161888919394
20
  MERaLiON-SpeechEncoder2-ASR-CTC,0.0486,0.0511,0.1856,0.2678,0.1363,0.0968
21
  Omnilingual-ASR-7B,0.1816984858459512,0.4328902788636956,0.975503383060243,0.8850665821179454,0.9044736152749075,0.8963283965903138
22
+ Fusion: Omnilingual-LLM-ASR-7B[with language code],0.1816984858459512,0.4328902788636956,0.975503383060243,0.8850665821179454,0.9044736152749075,0.8963283965903138
23
+ MERaLiON-ASR-dev-1215,0.04330334284251335,0.05137570002434867,0.18361528226572896,0.23871795194205886,0.13380805766733303,0.0957702805277863
results_organized/wer/asr_tamil.csv CHANGED
@@ -14,4 +14,5 @@ phi_4_multimodal_instruct,1.1784589191228196,1.7016514406184118,2.75005672425529
14
  whisper_large_v3,0.2448438631011245,0.2314476458186929,0.8481572720495284
15
  MERaLiON-SpeechEncoder2-ASR-CTC,0.1442,0.1632,0.6578
16
  Omnilingual-ASR-7B,0.3144055763521363,0.1062680115273775,0.867817443980474
17
- Fusion: Omnilingual-LLM-ASR-7B[with language code],0.3144055763521363,0.10626801152737753,0.8675527848026818
 
 
14
  whisper_large_v3,0.2448438631011245,0.2314476458186929,0.8481572720495284
15
  MERaLiON-SpeechEncoder2-ASR-CTC,0.1442,0.1632,0.6578
16
  Omnilingual-ASR-7B,0.3144055763521363,0.1062680115273775,0.867817443980474
17
+ Fusion: Omnilingual-LLM-ASR-7B[with language code],0.3144055763521363,0.1062680115273775,0.8675527848026818
18
+ MERaLiON-ASR-dev-1215,0.12422135451181095,0.13475052705551652,0.49745551197692134
results_organized/wer/asr_thai.csv CHANGED
@@ -14,4 +14,5 @@ phi_4_multimodal_instruct,1.7344522925894887,1.2856834920064666
14
  whisper_large_v3,0.2139446905303483,0.0282019040776001
15
  MERaLiON-SpeechEncoder2-ASR-CTC,0.1669999999999999,0.0137
16
  Omnilingual-ASR-7B,0.2754222795926698,0.4428487279459202
17
- Fusion: Omnilingual-LLM-ASR-7B[with language code],0.18804267478679157,0.03307060110515834
 
 
14
  whisper_large_v3,0.2139446905303483,0.0282019040776001
15
  MERaLiON-SpeechEncoder2-ASR-CTC,0.1669999999999999,0.0137
16
  Omnilingual-ASR-7B,0.2754222795926698,0.4428487279459202
17
+ Fusion: Omnilingual-LLM-ASR-7B[with language code],0.1880426747867915,0.0330706011051583
18
+ MERaLiON-ASR-dev-1215,0.15903747156710163,0.009951499910185018
results_organized/wer/asr_vietnamese.csv CHANGED
@@ -14,4 +14,5 @@ phi_4_multimodal_instruct,1.1070294304467498,2.5042567310800923
14
  whisper_large_v3,0.1366716070294304,0.1602754255313115
15
  MERaLiON-SpeechEncoder2-ASR-CTC,0.1987999999999999,0.1322
16
  Omnilingual-ASR-7B,0.1417272338606242,0.1516119663084519
17
- Fusion: Omnilingual-LLM-ASR-7B[with language code],0.12601539119281743,0.14677897182689514
 
 
14
  whisper_large_v3,0.1366716070294304,0.1602754255313115
15
  MERaLiON-SpeechEncoder2-ASR-CTC,0.1987999999999999,0.1322
16
  Omnilingual-ASR-7B,0.1417272338606242,0.1516119663084519
17
+ Fusion: Omnilingual-LLM-ASR-7B[with language code],0.1260153911928174,0.1467789718268951
18
+ MERaLiON-ASR-dev-1215,0.12428541181452467,0.07845317028625878