Datasets
open-r1/Mixture-of-Thoughts
17786 downloads
['task_categories:text-generation''language:en''size_categories:100K<n<1M'
mteb/sickr-sts
17774 downloads
['task_categories:sentence-similarity''task_ids:semantic-similarity-scoring''task_ids:natural-language-inference'
EdinburghNLP/xsum
17758 downloads
['task_categories:summarization''task_ids:news-articles-summarization''annotations_creators:found'
fka/awesome-chatgpt-prompts
17686 downloads
['task_categories:question-answering''license:cc0-1.0''size_categories:n<1K'
gatilin/rf100-vl-datasets
17685 downloads
['license:mit''modality:image''region:us']
lmms-lab/MMMU
17631 downloads
['size_categories:10K<n<100K''format:parquet''modality:image'
histai/HISTAI-skin-b2
17484 downloads
['license:cc-by-nc-4.0''arxiv:2505.12120''region:us']
princeton-nlp/prolong-data-64K
17483 downloads
['language:en''arxiv:2410.02660''region:us'
tiiuae/falcon-refinedweb
17426 downloads
['task_categories:text-generation''language:en''license:odc-by'
japanese-asr/whisper_transcriptions.mls.wer_10.0.vectorized
17378 downloads
['size_categories:1M<n<10M''format:parquet''library:datasets'