Datasets
yywwrr/mmarco_spanish
1699 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
zeta-alpha-ai/NanoFiQA2018
1698 downloads
['task_categories:text-retrieval''task_ids:document-retrieval''multilinguality:monolingual'
allenai/swag
1697 downloads
['task_categories:text-classification''task_ids:natural-language-inference''annotations_creators:crowdsourced'
Open-Orca/1million-gpt-4
1697 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
google/code_x_glue_cc_cloze_testing_maxmin
1696 downloads
['task_categories:text-generation''task_categories:fill-mask''task_ids:slot-filling'
gayanin/gcd-noised
1696 downloads
['size_categories:1K<n<10K''format:parquet''modality:text'
moondream/ia_ocr
1694 downloads
['license:openrail''size_categories:100K<n<1M''format:parquet'
HuggingFaceM4/DocumentVQA
1692 downloads
['size_categories:10K<n<100K''format:parquet''modality:image'
TimoImhof/TriviaQA-in-SQuAD-format
1691 downloads
['size_categories:10K<n<100K''format:parquet''modality:text'
TigerResearch/pretrain_zh
1688 downloads
['size_categories:10M<n<100M''format:parquet''modality:text'