Datasets

open-r1/Mixture-of-Thoughts

17786 downloads

['task_categories:text-generation''language:en''size_categories:100K<n<1M'

mteb/sickr-sts

17774 downloads

['task_categories:sentence-similarity''task_ids:semantic-similarity-scoring''task_ids:natural-language-inference'

EdinburghNLP/xsum

17758 downloads

['task_categories:summarization''task_ids:news-articles-summarization''annotations_creators:found'

fka/awesome-chatgpt-prompts

17686 downloads

['task_categories:question-answering''license:cc0-1.0''size_categories:n<1K'

gatilin/rf100-vl-datasets

17685 downloads

['license:mit''modality:image''region:us']

lmms-lab/MMMU

17631 downloads

['size_categories:10K<n<100K''format:parquet''modality:image'

histai/HISTAI-skin-b2

17484 downloads

['license:cc-by-nc-4.0''arxiv:2505.12120''region:us']

princeton-nlp/prolong-data-64K

17483 downloads

['language:en''arxiv:2410.02660''region:us'

tiiuae/falcon-refinedweb

17426 downloads

['task_categories:text-generation''language:en''license:odc-by'

japanese-asr/whisper_transcriptions.mls.wer_10.0.vectorized

17378 downloads

['size_categories:1M<n<10M''format:parquet''library:datasets'
Previous

Page 35 of 1635

Next