Upload folder using huggingface_hub
Browse files- app/content.py +27 -7
app/content.py
CHANGED
|
@@ -141,17 +141,37 @@ dataset_diaplay_information = {
|
|
| 141 |
'Parliament-Short': 'Under Development',
|
| 142 |
'UKUS-News-Short' : 'Under Development',
|
| 143 |
'Mediacorp-Short' : 'Under Development',
|
| 144 |
-
|
| 145 |
-
'YouTube ASR: English
|
| 146 |
-
|
| 147 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 148 |
|
| 149 |
'SEAME-Dev-Mandarin' : 'Under Development',
|
| 150 |
'SEAME-Dev-Singlish' : 'Under Development',
|
| 151 |
|
| 152 |
-
'YouTube SQA: English with Singapore Content': '
|
| 153 |
-
|
| 154 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 155 |
|
| 156 |
|
| 157 |
}
|
|
|
|
| 141 |
'Parliament-Short': 'Under Development',
|
| 142 |
'UKUS-News-Short' : 'Under Development',
|
| 143 |
'Mediacorp-Short' : 'Under Development',
|
| 144 |
+
|
| 145 |
+
'YouTube ASR: English Singapore Content' : '''YouTube Evaluation Dataset for ASR Task: \n
|
| 146 |
+
This dataset contains English and Singlish audio clips, featuring Singapore-related content. \n
|
| 147 |
+
It includes approximately 2.5 hours of audio, with individual clips ranging from 2 seconds to 30 seconds in length.''',
|
| 148 |
+
|
| 149 |
+
'YouTube ASR: English with Strong Emotion' : '''YouTube Evaluation Dataset for ASR Task: \n
|
| 150 |
+
This dataset contains audio clips in English and some unidentified languages, featuring speech with strong emotional expression. \n
|
| 151 |
+
It includes approximately 3.9 hours of audio, with each clip lasting 30 seconds.''',
|
| 152 |
+
|
| 153 |
+
'YouTube ASR: Malay English Prompt': '''YouTube Evaluation Dataset for ASR Task: \n
|
| 154 |
+
This dataset mainly contains Malay and some English audio clips, featuring English prompts. \n
|
| 155 |
+
It includes approximately 2.55 hours of audio, with individual clips ranging from 30 seconds to 95 seconds in length.''',
|
| 156 |
+
|
| 157 |
+
'YouTube ASR: Malay with Malay Prompt': '''YouTube Evaluation Dataset for ASR Task: \n
|
| 158 |
+
This dataset uses the same audio as *YouTube ASR: Malay English Prompt*, but with Malay prompts. \n
|
| 159 |
+
It includes approximately 2.55 hours of audio, with individual clips ranging from 30 seconds to 95 seconds in length.''',
|
| 160 |
|
| 161 |
'SEAME-Dev-Mandarin' : 'Under Development',
|
| 162 |
'SEAME-Dev-Singlish' : 'Under Development',
|
| 163 |
|
| 164 |
+
'YouTube SQA: English with Singapore Content': '''YouTube Evaluation Dataset for Speech-QA Task: \n
|
| 165 |
+
This dataset uses the same audio as *YouTube ASR: English Singapore Content*, featuring Singapore-related content. \n
|
| 166 |
+
It includes approximately 2.5 hours of audio, with individual clips ranging from 2 seconds to 30 seconds in length.''',
|
| 167 |
+
|
| 168 |
+
'YouTube SDS: English with Singapore Content': '''YouTube Evaluation Dataset for Summary Task: \n
|
| 169 |
+
This dataset uses the same audio as *YouTube ASR: English Singapore Content*, featuring Singapore-related content. \n
|
| 170 |
+
It includes approximately 2.5 hours of audio, with individual clips ranging from 2 seconds to 30 seconds in length.''',
|
| 171 |
+
|
| 172 |
+
'YouTube PQA: English with Singapore Content': '''YouTube Evaluation Dataset for Paralinguistics Task: \n
|
| 173 |
+
This dataset uses the same audio as *YouTube ASR: English Singapore Content*, featuring Singapore-related content. \n
|
| 174 |
+
It includes approximately 2.5 hours of audio, with individual clips ranging from 2 seconds to 30 seconds in length.''',
|
| 175 |
|
| 176 |
|
| 177 |
}
|