Datasets
sentence-transformers/msmarco-bm25
5941 downloads
['task_categories:feature-extraction''task_categories:sentence-similarity''multilinguality:monolingual'
OpenGVLab/ShareGPT-4o
5840 downloads
['task_categories:visual-question-answering''task_categories:question-answering''language:en'
asahi417/seamless-align-enA-frA.speaker-embedding.w2vbert-600m
5696 downloads
['size_categories:1M<n<10M''format:parquet''modality:tabular'
xuejun72/HR-VILAGE-3K3M
5679 downloads
['task_categories:zero-shot-classification''task_categories:feature-extraction''task_categories:token-classification'
deepghs-wip/Renai-Circulation
5386 downloads
['annotations_creators:no-annotation''source_datasets:pixiv''language:en'
rungalileo/ragbench
5370 downloads
['license:cc-by-4.0''size_categories:10K<n<100K''format:parquet'
bigcode/the-stack-smol-xs
5337 downloads
['task_categories:text-generation''task_ids:language-modeling''language_creators:crowdsourced'
UCSC-VLAA/Recap-DataComp-1B
5308 downloads
['task_categories:zero-shot-classification''task_categories:text-retrieval''task_categories:image-to-text'
luca-g97/dolma-v1_7-50B-second-phase
5261 downloads
['size_categories:100M<n<1B''format:json''modality:tabular'
maykcaldas/smiles-transformers
5154 downloads
['language:en''license:mit''size_categories:1B<n<10B'