Datasets
deepinv/images
8288 downloads
['license:bsd-3-clause''region:us']
BramVanroy/fineweb-2-duckdbs
8046 downloads
['license:odc-by''region:us']
dalle-mini/YFCC100M_OpenAI_subset
8240 downloads
['size_categories:10K<n<100K''modality:image''modality:text'
atokforps/latent_worker_early-a2_01
8233 downloads
['region:us']
yeliudev/VideoMind-Dataset
8219 downloads
['license:bsd-3-clause''arxiv:2503.13444''region:us']
parler-tts/images
8203 downloads
['size_categories:n<1K''format:imagefolder''modality:image'
prince-canuma/fineweb-CC-MAIN-2024-10-1B-en
8190 downloads
['size_categories:1M<n<10M''format:parquet''modality:tabular'
fineinstructions-pretraining/nemotron_synthetic_1T
8174 downloads
['size_categories:1B<n<10B''format:parquet''modality:text'
fineinstructions-pretraining/nemotron_wrap_1T
8150 downloads
['size_categories:100M<n<1B''format:parquet''modality:text'
IWSLT/iwslt2017
8149 downloads
['task_categories:translation''annotations_creators:crowdsourced''language_creators:expert-generated'