Datasets
EleutherAI/wikitext_document_level
34617 downloads
['license:cc-by-sa-3.0''size_categories:10K<n<100K''format:parquet'
google-research-datasets/mbpp
38770 downloads
['task_categories:text2text-generation''annotations_creators:crowdsourced''annotations_creators:expert-generated'
fancyzhx/ag_news
37795 downloads
['task_categories:text-classification''task_ids:topic-classification''annotations_creators:found'
truthfulqa/truthful_qa
37719 downloads
['task_categories:multiple-choice''task_categories:text-generation''task_categories:question-answering'
nvidia/OpenMathReasoning
36653 downloads
['task_categories:question-answering''task_categories:text-generation''language:en'
multimodalart/lora-fusing-preferences
36358 downloads
['license:mit''size_categories:1K<n<10K''format:imagefolder'
nexa-collaboration/fineweb_filtered
35132 downloads
['size_categories:100M<n<1B''format:parquet''modality:tabular'
princeton-nlp/SWE-bench_Lite
35003 downloads
['size_categories:n<1K''format:parquet''modality:text'
tensorshield/reddit_dataset_157
34740 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:question-answering'
occiglot/tokenizer-wiki-bench
33634 downloads
['language:af''language:ar''language:bg'