Datasets
princeton-nlp/SWE-bench
24935 downloads
['size_categories:10K<n<100K''format:parquet''modality:text'
taeminlee/Ko-StrategyQA
24872 downloads
['task_categories:text-retrieval''task_ids:document-retrieval''multilinguality:monolingual'
dair-ai/emotion
24858 downloads
['task_categories:text-classification''task_ids:multi-class-classification''annotations_creators:machine-generated'
prince-canuma/fineweb-CC-MAIN-2024-10-6B-en
24731 downloads
['size_categories:1M<n<10M''format:parquet''modality:tabular'
opencsg/Fineweb-Edu-Chinese-V2.1
24561 downloads
['task_categories:text-generation''language:zh''license:apache-2.0'
ieasybooks-org/waqfeya-library
24497 downloads
['task_categories:image-to-text''language:ar''license:mit'
bigcode/the-stack
24274 downloads
['task_categories:text-generation''language_creators:crowdsourced''language_creators:expert-generated'
bastao/VeraCruz_PT-BR
24155 downloads
['task_categories:text-generation''task_categories:text-classification''language:pt'
BLIP3o/BLIP3o-Pretrain-Long-Caption
24154 downloads
['license:apache-2.0''size_categories:10M<n<100M''format:webdataset'
mit-han-lab/pile-val-backup
23700 downloads
['size_categories:100K<n<1M''format:json''modality:text'