Datasets
Cnam-LMSSC/vibravox
7160 downloads
['task_categories:audio-to-audio''task_categories:automatic-speech-recognition''task_categories:audio-classification'
mozilla-foundation/common_voice_13_0
6862 downloads
['task_categories:automatic-speech-recognition''annotations_creators:crowdsourced''language_creators:crowdsourced'
fixie-ai/librispeech_asr
6696 downloads
['language:en''size_categories:100K<n<1M''format:parquet'
mythicinfinity/libritts
6547 downloads
['task_categories:text-to-speech''language:en''license:cc-by-4.0'
distil-whisper/librispeech_long
6525 downloads
['size_categories:n<1K''format:parquet''modality:audio'
speechbrain/LoquaciousSet
6505 downloads
['task_categories:automatic-speech-recognition''annotations_creators:crowdsourced''annotations_creators:machine-generated'
hr16/kinh-phap-hoa-ke-trom-huong
6323 downloads
['task_categories:text-to-audio''task_categories:text-to-speech''task_categories:automatic-speech-recognition'
fixie-ai/gigaspeech
6314 downloads
['size_categories:10M<n<100M''format:parquet''modality:audio'
farsi-asr/ganjoor-dataset
5774 downloads
['size_categories:10K<n<100K''format:webdataset''modality:audio'
jp1924/AudioCaps
5761 downloads
['size_categories:10K<n<100K''format:parquet''modality:audio'