Datasets
Metanova/SAVI-2020
7605 downloads
['size_categories:1B<n<10B''format:csv''modality:tabular'
Lyte/fineweb-edu-2016-26-750k
7604 downloads
['language:en''size_categories:100K<n<1M''format:parquet'
bradfordlevy/BeanCounter
7569 downloads
['size_categories:10M<n<100M''modality:text''arxiv:2409.17827'
BestWishYsh/OpenS2V-5M
7569 downloads
['task_categories:text-to-video''task_categories:image-to-video''language:en'
metchee/u-sticker
7544 downloads
['language:ar''language:zh''language:en'
banned-historical-archives/huaqiaoribao
7540 downloads
['size_categories:1K<n<10K''format:imagefolder''modality:image'
nlphuji/flickr30k
7535 downloads
['size_categories:10K<n<100K''modality:image''modality:text'
ChristophSchuhmann/1-sentence-level-gutenberg-en_arxiv_pubmed_soda
7522 downloads
['size_categories:100M<n<1B''format:parquet''modality:text'
Spawning/pd12m-full
7504 downloads
['language:en''license:cdla-permissive-2.0''size_categories:10M<n<100M'
facebook/wiki_dpr
7503 downloads
['task_categories:fill-mask''task_categories:text-generation''task_ids:language-modeling'