Upload folder using huggingface_hub
Browse files- app/content.py +5 -5
- app/show_examples.py +0 -8
app/content.py
CHANGED
|
@@ -146,18 +146,18 @@ dataset_diaplay_information = {
|
|
| 146 |
|
| 147 |
'YouTube ASR: English with Strong Emotion' : 'YouTube Evaluation Dataset for ASR Task: <br> This dataset contains English and some unknown languages audio clips, featuring speech with strong emotional expression. <br> It includes approximately 3.9 hours of audio, with each clip lasting 30 seconds.',
|
| 148 |
|
| 149 |
-
'YouTube ASR: Malay English Prompt': 'YouTube Evaluation Dataset for ASR Task: <br> This dataset mainly contains Malay and some English audio clips, featuring with English prompts. <br> It includes approximately 2.55 hours of audio, with indicidual clips ranging form 30 seconds to 95 seconds in length.',
|
| 150 |
|
| 151 |
-
'YouTube ASR: Malay with Malay Prompt': 'YouTube Evaluation Dataset for ASR Task: <br> This dataset use the same audio from <i>YouTube ASR: Malay English Prompt</i>, except featuring with Malay prompts. <br> It includes approximately 2.55 hours of audio, with indicidual clips ranging form 30 seconds to 95 seconds in length.',
|
| 152 |
|
| 153 |
'SEAME-Dev-Mandarin' : 'Under Development',
|
| 154 |
'SEAME-Dev-Singlish' : 'Under Development',
|
| 155 |
|
| 156 |
-
'YouTube SQA: English with Singapore Content': 'YouTube Evaluation Dataset for Speech-QA Task: <br> This dataset
|
| 157 |
|
| 158 |
-
'YouTube SDS: English with Singapore Content': 'YouTube Evaluation Dataset for Summary Task: <br> This dataset
|
| 159 |
|
| 160 |
-
'YouTube PQA: English with Singapore Content': 'YouTube Evaluation Dataset for Paralinguistics Task: <br> This dataset
|
| 161 |
|
| 162 |
|
| 163 |
}
|
|
|
|
| 146 |
|
| 147 |
'YouTube ASR: English with Strong Emotion' : 'YouTube Evaluation Dataset for ASR Task: <br> This dataset contains English and some unknown languages audio clips, featuring speech with strong emotional expression. <br> It includes approximately 3.9 hours of audio, with each clip lasting 30 seconds.',
|
| 148 |
|
| 149 |
+
'YouTube ASR: Malay English Prompt': 'YouTube Evaluation Dataset for ASR Task: <br> This dataset mainly contains Malay and some Malay-English codeswitch audio clips, featuring English prompts. <br> It includes approximately 2.55 hours of audio, with individual clips ranging from 30 seconds to 95 seconds in length.',
|
| 150 |
|
| 151 |
+
# 'YouTube ASR: Malay with Malay Prompt': 'YouTube Evaluation Dataset for ASR Task: <br> This dataset uses the same audio as <i>YouTube ASR: Malay English Prompt</i>, except featuring Malay prompts. <br> It includes approximately 2.55 hours of audio, with individual clips ranging from 30 seconds to 95 seconds in length.',
|
| 152 |
|
| 153 |
'SEAME-Dev-Mandarin' : 'Under Development',
|
| 154 |
'SEAME-Dev-Singlish' : 'Under Development',
|
| 155 |
|
| 156 |
+
'YouTube SQA: English with Singapore Content': 'YouTube Evaluation Dataset for Speech-QA Task: <br> This dataset contains English and Singlish audio clips, featuring Singapore-related content. <br> It includes approximately 7.6 hours of audio, with individual clips ranging from 8 seconds to 32 seconds in length.',
|
| 157 |
|
| 158 |
+
'YouTube SDS: English with Singapore Content': 'YouTube Evaluation Dataset for Summary Task: <br> This dataset contains English and Singlish audio clips, featuring Singapore-related content. <br> It includes approximately 5.4 hours of audio, with individual clips ranging from 8 seconds to 32 seconds in length.',
|
| 159 |
|
| 160 |
+
'YouTube PQA: English with Singapore Content': 'YouTube Evaluation Dataset for Paralinguistics QA Task: <br> This dataset contains English and Singlish audio clips, featuring Singapore-related content. <br> It includes approximately 41.4 hours of audio, with individual clips ranging from 41 seconds to 83 seconds in length.',
|
| 161 |
|
| 162 |
|
| 163 |
}
|
app/show_examples.py
CHANGED
|
@@ -60,14 +60,6 @@ def show_dataset_examples(display_name):
|
|
| 60 |
"""
|
| 61 |
st.markdown(custom_css, unsafe_allow_html=True)
|
| 62 |
|
| 63 |
-
# s = f"""<tr>
|
| 64 |
-
# <td><b>{html.escape(question_text.replace('(A)', '<br>(A)').replace('(B)', '<br>(B)').replace('(C)', '<br>(C)'))}
|
| 65 |
-
# </td>
|
| 66 |
-
# <td><b>{html.escape(dataset[index]['answer']['text'])}
|
| 67 |
-
# </td>
|
| 68 |
-
# </tr>
|
| 69 |
-
# """
|
| 70 |
-
|
| 71 |
body_details = f"""<table style="table-layout: fixed; width:100%">
|
| 72 |
<thead>
|
| 73 |
<tr style="text-align: center;">
|
|
|
|
| 60 |
"""
|
| 61 |
st.markdown(custom_css, unsafe_allow_html=True)
|
| 62 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 63 |
body_details = f"""<table style="table-layout: fixed; width:100%">
|
| 64 |
<thead>
|
| 65 |
<tr style="text-align: center;">
|