Datasets
MLCommons/peoples_speech
21238 downloads
['task_categories:automatic-speech-recognition''annotations_creators:crowdsourced''annotations_creators:machine-generated'
mlabonne/FineTome-100k
20937 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
hf-internal-testing/fixtures_image_utils
20836 downloads
['size_categories:n<1K''modality:image''modality:text'
agibot-world/AgiBotWorld-Beta
20683 downloads
['task_categories:other''language:en''size_categories:100M<n<1B'
awwaawwa/BabelDOC-Assets
20580 downloads
['size_categories:n<1K''format:text''modality:text'
google/IFEval
20519 downloads
['task_categories:text-generation''language:en''license:apache-2.0'
prince-canuma/fineweb-CC-MAIN-2024-10-8B-en
20391 downloads
['size_categories:10M<n<100M''format:parquet''modality:tabular'
tahoebio/Tahoe-100M
20061 downloads
['license:cc0-1.0''size_categories:100M<n<1B''format:parquet'
fixie-ai/common_voice_17_0
19608 downloads
['size_categories:10M<n<100M''format:parquet''modality:audio'
nkp37/OpenVid-1M
19508 downloads
['task_categories:text-to-video''language:en''license:cc-by-4.0'