zhuohan-7 commited on
Commit
3732534
·
1 Parent(s): 42ba589

Upload folder using huggingface_hub

Browse files
Files changed (1) hide show
  1. app/content.py +16 -16
app/content.py CHANGED
@@ -143,35 +143,35 @@ dataset_diaplay_information = {
143
  'Mediacorp-Short' : 'Under Development',
144
 
145
  'YouTube ASR: English Singapore Content' : '''YouTube Evaluation Dataset for ASR Task: \n
146
- This dataset contains English and Singlish audio clips, featuring Singapore-related content. \n
147
- It includes approximately 2.5 hours of audio, with individual clips ranging from 2 seconds to 30 seconds in length.''',
148
 
149
  'YouTube ASR: English with Strong Emotion' : '''YouTube Evaluation Dataset for ASR Task: \n
150
- This dataset contains English and some unknown languages audio clips, featuring speech with strong emotional expression. \n
151
- It includes approximately 3.9 hours of audio, with each clip lasting 30 seconds.''',
152
 
153
- 'YouTube ASR: Malay English Prompt': '''YouTube Evaluation Dataset for ASR Task: \n
154
- This dataset mainly contains Malay and some English audio clips, featuring with English prompts. \n
155
- It includes approximately 2.55 hours of audio, with indicidual clips ranging form 30 seconds to 95 seconds in length.''',
156
 
157
- 'YouTube ASR: Malay with Malay Prompt': '''YouTube Evaluation Dataset for ASR Task: \n
158
- This dataset use the same audio from *YouTube ASR: Malay English Prompt*, except featuring with Malay prompts. \n
159
- It includes approximately 2.55 hours of audio, with indicidual clips ranging form 30 seconds to 95 seconds in length.''',
160
 
161
  'SEAME-Dev-Mandarin' : 'Under Development',
162
  'SEAME-Dev-Singlish' : 'Under Development',
163
 
164
  'YouTube SQA: English with Singapore Content': '''YouTube Evaluation Dataset for Speech-QA Task: \n
165
- This dataset use the same audio from *YouTube ASR: English Singapore Content*, featuring Singapore-related content. \n
166
- It includes approximately 2.5 hours of audio, with individual clips ranging from 2 seconds to 30 seconds in length.''',
167
 
168
  'YouTube SDS: English with Singapore Content': '''YouTube Evaluation Dataset for Summary Task: \n
169
- This dataset use the same audio from *YouTube ASR: English Singapore Content*, featuring Singapore-related content. \n
170
- It includes approximately 2.5 hours of audio, with individual clips ranging from 2 seconds to 30 seconds in length.''',
171
 
172
  'YouTube PQA: English with Singapore Content': '''YouTube Evaluation Dataset for Paralinguistics Task: \n
173
- This dataset use the same audio from *YouTube ASR: English Singapore Content*, featuring Singapore-related content. \n
174
- It includes approximately 2.5 hours of audio, with individual clips ranging from 2 seconds to 30 seconds in length.''',
175
 
176
 
177
  }
 
143
  'Mediacorp-Short' : 'Under Development',
144
 
145
  'YouTube ASR: English Singapore Content' : '''YouTube Evaluation Dataset for ASR Task: \n
146
+ This dataset contains English and Singlish audio clips, featuring Singapore-related content. \n
147
+ It includes approximately 2.5 hours of audio, with individual clips ranging from 2 seconds to 30 seconds in length.''',
148
 
149
  'YouTube ASR: English with Strong Emotion' : '''YouTube Evaluation Dataset for ASR Task: \n
150
+ This dataset contains English and some unknown languages audio clips, featuring speech with strong emotional expression. \n
151
+ It includes approximately 3.9 hours of audio, with each clip lasting 30 seconds.''',
152
 
153
+ 'YouTube ASR: Malay English Prompt': '''YouTube Evaluation Dataset for ASR Task: \n
154
+ This dataset mainly contains Malay and some English audio clips, featuring with English prompts. \n
155
+ It includes approximately 2.55 hours of audio, with indicidual clips ranging form 30 seconds to 95 seconds in length.''',
156
 
157
+ 'YouTube ASR: Malay with Malay Prompt': '''YouTube Evaluation Dataset for ASR Task: \n
158
+ This dataset use the same audio from *YouTube ASR: Malay English Prompt*, except featuring with Malay prompts. \n
159
+ It includes approximately 2.55 hours of audio, with indicidual clips ranging form 30 seconds to 95 seconds in length.''',
160
 
161
  'SEAME-Dev-Mandarin' : 'Under Development',
162
  'SEAME-Dev-Singlish' : 'Under Development',
163
 
164
  'YouTube SQA: English with Singapore Content': '''YouTube Evaluation Dataset for Speech-QA Task: \n
165
+ This dataset use the same audio from *YouTube ASR: English Singapore Content*, featuring Singapore-related content. \n
166
+ It includes approximately 2.5 hours of audio, with individual clips ranging from 2 seconds to 30 seconds in length.''',
167
 
168
  'YouTube SDS: English with Singapore Content': '''YouTube Evaluation Dataset for Summary Task: \n
169
+ This dataset use the same audio from *YouTube ASR: English Singapore Content*, featuring Singapore-related content. \n
170
+ It includes approximately 2.5 hours of audio, with individual clips ranging from 2 seconds to 30 seconds in length.''',
171
 
172
  'YouTube PQA: English with Singapore Content': '''YouTube Evaluation Dataset for Paralinguistics Task: \n
173
+ This dataset use the same audio from *YouTube ASR: English Singapore Content*, featuring Singapore-related content. \n
174
+ It includes approximately 2.5 hours of audio, with individual clips ranging from 2 seconds to 30 seconds in length.''',
175
 
176
 
177
  }