Skip to content

Commit

Permalink
add aishell-3 dataset
Browse files Browse the repository at this point in the history
  • Loading branch information
SuperKogito committed Jun 23, 2024
1 parent 527b362 commit 0312e33
Showing 1 changed file with 15 additions and 1 deletion.
16 changes: 15 additions & 1 deletion src/ser-datasets.json
Original file line number Diff line number Diff line change
Expand Up @@ -228,7 +228,7 @@
"Content": "10045 video-audio clips in the wild.",
"Emotions": "11 single-label emotion categories (anger, disgust, fear, happiness, neutral, sadness, surprise, contempt, anxiety, helplessness, and disappointment) and 32 multi-label emotion categories.",
"Format": "Audio, Video",
"Size": "58 GB",
"Size": "--",
"Language": "--",
"Paper": "MAFW: A Large-scale, Multi-modal, Compound Affective Database for Dynamic Facial Expression Recognition in the Wild",
"Access": "Restricted",
Expand Down Expand Up @@ -461,6 +461,20 @@
"Paper-link": "http://www.interspeech2020.org/index.php?m=content&c=index&a=show&catid=290&id=684",
"License-link": "Academic License & Commercial License"
},
"AISHELL-3": {
"Year": 2020,
"Content": "Roughly 85 hours of emotion-neutral recordings spoken by 218 native Chinese mandarin speakers and total 88035 utterances.",
"Emotions": "Neutral",
"Format": "Audio",
"Size": "19 GB",
"Language": "Chinese (Mandarin)",
"Paper": "AISHELL-3: A Multi-speaker Mandarin TTS Corpus and the Baselines",
"Access": "Open",
"License": "Apache 2.0",
"Dataset-link": "https://www.openslr.org/93/",
"Paper-link": "https://arxiv.org/abs/2010.11567",
"License-link": "https://apache.org/licenses/LICENSE-2.0"
},
"BEASC": {
"Year": 2020,
"Content": "Bangla Emotional Audio-Speech Corpus",
Expand Down

0 comments on commit 0312e33

Please sign in to comment.