Datasets
Hyper-AI-Computer/KeystoneFuse-Train-Data-Pretrain-V3
3332 downloads
['size_categories:1M<n<10M''format:parquet''modality:text'
StormKing99/x_dataset_8191
3322 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:question-answering'
mteb/fiqa
3314 downloads
['task_categories:text-retrieval''task_ids:multiple-choice-qa''annotations_creators:human-annotated'
Amod/mental_health_counseling_conversations
3311 downloads
['task_categories:text-generation''task_categories:question-answering''language:en'
Hothan/OlympiadBench
3305 downloads
['task_categories:question-answering''task_categories:visual-question-answering''language:zh'
lyk/ArxivEmbedding
3305 downloads
['task_categories:text-classification''language:en''size_categories:100K<n<1M'
common-canvas/commoncatalog-cc-by-nc-nd
3297 downloads
['task_categories:text-to-image''language:en''license:cc-by-nc-nd-4.0'
bigcode/the-stack-v2-train-smol-ids
3297 downloads
['task_categories:text-generation''language_creators:crowdsourced''language_creators:expert-generated'
zkpbeats/reddit_ds_479243
3295 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:question-answering'
mitermix/audiosnippets_small_with_detailed_annotation
3266 downloads
['size_categories:100K<n<1M''format:webdataset''modality:audio'