Datasets
ontocord/CulturaY
16926 downloads
['task_categories:text-generation''task_categories:fill-mask''task_ids:language-modeling'
mteb/biosses-sts
16653 downloads
['task_categories:sentence-similarity''task_ids:semantic-similarity-scoring''annotations_creators:derived'
LLM360/K2Datasets
15146 downloads
['license:odc-by''size_categories:100K<n<1M''format:json'
mteb/amazon_massive_intent
15090 downloads
['task_categories:text-classification''annotations_creators:human-annotated''multilinguality:translated'
ChongyanChen/VQAonline
14860 downloads
['task_categories:visual-question-answering''license:cc-by-sa-4.0''size_categories:10K<n<100K'
nkandpa2/common-pile-filtered
14538 downloads
['size_categories:1B<n<10B''format:json''modality:text'
a-m-team/AM-DeepSeek-Distilled-40M
13732 downloads
['task_categories:text-generation''language:zh''language:en'
Anthropic/hh-rlhf
12573 downloads
['license:mit''size_categories:100K<n<1M''format:json'
OpenGVLab/MVBench
12512 downloads
['task_categories:visual-question-answering''task_categories:video-classification''language:en'
openbmb/DCAD-2000
12305 downloads
['multilinguality:multilingual''language:eng''language:rus'