Datasets
bookcorpus/bookcorpus
14003 downloads
['task_categories:text-generation''task_categories:fill-mask''task_ids:language-modeling'
CohereLabs/include-base-44
14425 downloads
['task_categories:text2text-generation''task_categories:multiple-choice''language:sq'
QingyiSi/Alpaca-CoT
14403 downloads
['language:en''language:zh''language:ml'
uonlp/CulturaX
14348 downloads
['task_categories:text-generation''task_categories:fill-mask''task_ids:language-modeling'
Helsinki-NLP/europarl
14336 downloads
['task_categories:translation''annotations_creators:found''language_creators:found'
argmaxinc/whisperkit-evals-multilingual
14329 downloads
['region:us''whisper''whisperkit'
agkphysics/AudioSet
14268 downloads
['task_categories:audio-classification''source_datasets:original''language:en'
k-l-lambda/NotaGenX-opus
14261 downloads
['license:mit''region:us']
Jiayi-Pan/Countdown-Tasks-3to4
14157 downloads
['size_categories:100K<n<1M''format:parquet''library:datasets'
ember-lab-berkeley/AMASS_Retargeted_for_G1
14151 downloads
['task_categories:robotics''license:cc-by-4.0''size_categories:10K<n<100K'