Datasets
openlanguagedata/flores_plus
4104 downloads
['task_categories:text2text-generation''task_categories:translation''annotations_creators:found'
nyuuzyou/subdomains
4103 downloads
['task_categories:other''annotations_creators:machine-generated''language_creators:found'
toxigen/toxigen-data
4102 downloads
['task_categories:text-classification''task_ids:hate-speech-detection''annotations_creators:expert-generated'
HOIGen/HOIGen-1M
4101 downloads
['task_categories:text-to-video''language:en''license:apache-2.0'
philipp-zettl/mtg_cards-2025-04-04
4091 downloads
['task_categories:sentence-similarity''language:en''size_categories:1M<n<10M'
clip-benchmark/wds_fer2013
4083 downloads
['size_categories:10K<n<100K''format:webdataset''modality:image'
MykMaks/nordjylland-news-image-captioning
4076 downloads
['task_categories:zero-shot-classification''language:da''size_categories:10K<n<100K'
dai22dai/video
4073 downloads
['license:other''size_categories:1K<n<10K''format:imagefolder'
gpt-omni/VoiceAssistant-400K
4072 downloads
['license:apache-2.0''size_categories:100K<n<1M''format:parquet'
simon3000/genshin-voice
4065 downloads
['task_categories:audio-classification''task_categories:automatic-speech-recognition''task_categories:text-to-speech'