binwang committed on
Commit
0688ab3
·
verified ·
1 Parent(s): 969eb10

Upload folder using huggingface_hub

Browse files
Files changed (2) hide show
  1. app/content.py +22 -23
  2. app/pages.py +2 -0
app/content.py CHANGED
@@ -108,29 +108,28 @@ dataset_diaplay_information = {
108
  'VoxCeleb-Accent' : 'Test dataset for accent recognition, based on VoxCeleb, a large speaker identification dataset.',
109
  'MNSC-AR-Sentence' : 'Accent recognition based on the IMDA NSC dataset, focusing on sentence-level accents.',
110
  'MNSC-AR-Dialogue' : 'Accent recognition based on the IMDA NSC dataset, focusing on dialogue-level accents.',
111
-
112
- 'VoxCeleb-Gender': 'Test dataset for gender classification, also derived from VoxCeleb.',
113
- 'IEMOCAP-Gender' : 'Gender classification based on the IEMOCAP dataset.',
114
- 'IEMOCAP-Emotion': 'Emotion recognition test data from the IEMOCAP dataset, focusing on identifying emotions in speech.',
115
- 'MELD-Sentiment' : 'Sentiment recognition from speech using the MELD dataset, classifying positive, negative, or neutral sentiments.',
116
- 'MELD-Emotion' : 'Emotion classification in speech using MELD, detecting specific emotions like happiness, anger, etc.',
117
- 'MuChoMusic' : 'Test dataset for music understanding, from paper: MuChoMusic: Evaluating Music Understanding in Multimodal Audio-Language Models.',
118
- 'MNSC-PART1-ASR' : 'Speech recognition test data from the IMDA NSC project, Part 1.',
119
- 'MNSC-PART2-ASR' : 'Speech recognition test data from the IMDA NSC project, Part 2.',
120
- 'MNSC-PART3-ASR' : 'Speech recognition test data from the IMDA NSC project, Part 3.',
121
- 'MNSC-PART4-ASR' : 'Speech recognition test data from the IMDA NSC project, Part 4.',
122
- 'MNSC-PART5-ASR' : 'Speech recognition test data from the IMDA NSC project, Part 5.',
123
- 'MNSC-PART6-ASR' : 'Speech recognition test data from the IMDA NSC project, Part 6.',
124
- 'MNSC-PART3-SQA' : 'Multitak National Speech Corpus (MNSC) dataset, Question answering task, Part 3.',
125
- 'MNSC-PART4-SQA' : 'Multitak National Speech Corpus (MNSC) dataset, Question answering task, Part 4.',
126
- 'MNSC-PART5-SQA' : 'Multitak National Speech Corpus (MNSC) dataset, Question answering task, Part 5.',
127
- 'MNSC-PART6-SQA' : 'Multitak National Speech Corpus (MNSC) dataset, Question answering task, Part 6.',
128
- 'MNSC-PART3-SDS' : 'Multitak National Speech Corpus (MNSC) dataset, dialogue summarization task, Part 3.',
129
- 'MNSC-PART4-SDS' : 'Multitak National Speech Corpus (MNSC) dataset, dialogue summarization task, Part 4.',
130
- 'MNSC-PART5-SDS' : 'Multitak National Speech Corpus (MNSC) dataset, dialogue summarization task, Part 5.',
131
- 'MNSC-PART6-SDS' : 'Multitak National Speech Corpus (MNSC) dataset, dialogue summarization task, Part 6.',
132
- 'SEAME-Dev-Man' : 'SEAME dataset, English-Mandarin Code-swithcing',
133
- 'SEAME-Dev-Sge' : 'SEAME dataset, English-Mandarin Code-swithcing',
134
 
135
  'CNA' : 'Under Development',
136
  'IDPC' : 'Under Development',
 
108
  'VoxCeleb-Accent' : 'Test dataset for accent recognition, based on VoxCeleb, a large speaker identification dataset.',
109
  'MNSC-AR-Sentence' : 'Accent recognition based on the IMDA NSC dataset, focusing on sentence-level accents.',
110
  'MNSC-AR-Dialogue' : 'Accent recognition based on the IMDA NSC dataset, focusing on dialogue-level accents.',
111
+ 'VoxCeleb-Gender' : 'Test dataset for gender classification, also derived from VoxCeleb.',
112
+ 'IEMOCAP-Gender' : 'Gender classification based on the IEMOCAP dataset.',
113
+ 'IEMOCAP-Emotion' : 'Emotion recognition test data from the IEMOCAP dataset, focusing on identifying emotions in speech.',
114
+ 'MELD-Sentiment' : 'Sentiment recognition from speech using the MELD dataset, classifying positive, negative, or neutral sentiments.',
115
+ 'MELD-Emotion' : 'Emotion classification in speech using MELD, detecting specific emotions like happiness, anger, etc.',
116
+ 'MuChoMusic' : 'Test dataset for music understanding, from paper: MuChoMusic: Evaluating Music Understanding in Multimodal Audio-Language Models.',
117
+ 'MNSC-PART1-ASR' : 'Speech recognition test data from the IMDA NSC project, Part 1.',
118
+ 'MNSC-PART2-ASR' : 'Speech recognition test data from the IMDA NSC project, Part 2.',
119
+ 'MNSC-PART3-ASR' : 'Speech recognition test data from the IMDA NSC project, Part 3.',
120
+ 'MNSC-PART4-ASR' : 'Speech recognition test data from the IMDA NSC project, Part 4.',
121
+ 'MNSC-PART5-ASR' : 'Speech recognition test data from the IMDA NSC project, Part 5.',
122
+ 'MNSC-PART6-ASR' : 'Speech recognition test data from the IMDA NSC project, Part 6.',
123
+ 'MNSC-PART3-SQA' : 'Multitak National Speech Corpus (MNSC) dataset, Question answering task, Part 3.',
124
+ 'MNSC-PART4-SQA' : 'Multitak National Speech Corpus (MNSC) dataset, Question answering task, Part 4.',
125
+ 'MNSC-PART5-SQA' : 'Multitak National Speech Corpus (MNSC) dataset, Question answering task, Part 5.',
126
+ 'MNSC-PART6-SQA' : 'Multitak National Speech Corpus (MNSC) dataset, Question answering task, Part 6.',
127
+ 'MNSC-PART3-SDS' : 'Multitak National Speech Corpus (MNSC) dataset, dialogue summarization task, Part 3.',
128
+ 'MNSC-PART4-SDS' : 'Multitak National Speech Corpus (MNSC) dataset, dialogue summarization task, Part 4.',
129
+ 'MNSC-PART5-SDS' : 'Multitak National Speech Corpus (MNSC) dataset, dialogue summarization task, Part 5.',
130
+ 'MNSC-PART6-SDS' : 'Multitak National Speech Corpus (MNSC) dataset, dialogue summarization task, Part 6.',
131
+ 'SEAME-Dev-Man' : 'SEAME dataset, English-Mandarin Code-swithcing',
132
+ 'SEAME-Dev-Sge' : 'SEAME dataset, English-Mandarin Code-swithcing',
 
133
 
134
  'CNA' : 'Under Development',
135
  'IDPC' : 'Under Development',
app/pages.py CHANGED
@@ -167,6 +167,8 @@ def asr_singlish():
167
  'MNSC-PART4-ASR',
168
  'MNSC-PART5-ASR',
169
  'MNSC-PART6-ASR',
 
 
170
  ]
171
 
172
  filters_levelone = sum + dataset_lists
 
167
  'MNSC-PART4-ASR',
168
  'MNSC-PART5-ASR',
169
  'MNSC-PART6-ASR',
170
+ 'SEAME-Dev-Man',
171
+ 'SEAME-Dev-Sge',
172
  ]
173
 
174
  filters_levelone = sum + dataset_lists