Datasets
bastao/VeraCruz_PT-BR
24155 downloads
['task_categories:text-generation''task_categories:text-classification''language:pt'
BLIP3o/BLIP3o-Pretrain-Long-Caption
24154 downloads
['license:apache-2.0''size_categories:10M<n<100M''format:webdataset'
openbmb/Ultra-FineWeb
20932 downloads
['task_categories:text-generation''language:en''language:zh'
legacy-datasets/c4
24069 downloads
['task_categories:text-generation''task_categories:fill-mask''task_ids:language-modeling'
hltcoe/megawika
24008 downloads
['task_categories:summarization''task_categories:question-answering''task_categories:text-generation'
allenai/reward-bench-results
23748 downloads
['region:us']
mit-han-lab/pile-val-backup
23700 downloads
['size_categories:100K<n<1M''format:json''modality:text'
mandarjoshi/trivia_qa
23547 downloads
['task_categories:question-answering''task_categories:text2text-generation''task_ids:open-domain-qa'
su-fmi/msi-drone-crop-surveys
23440 downloads
['language:en''license:cc-by-4.0''size_categories:1K<n<10K'
mlfoundations/MINT-1T-PDF-CC-2023-23
23292 downloads
['task_categories:image-to-text''task_categories:text-generation''language:en'