Datasets
SynthLabsAI/PERSONA
3692 downloads
['language:en''license:cc-by-nc-sa-4.0''size_categories:100K<n<1M'
EuropeanParliament/Eurovoc
3691 downloads
['license:eupl-1.1''size_categories:1M<n<10M''format:json'
joey234/vi_crawl
2937 downloads
['size_categories:1M<n<10M''format:webdataset''modality:text'
ZechengLi19/CSL-News
3674 downloads
['task_categories:video-text-to-text''language:zh''license:cc-by-nc-4.0'
sentence-transformers/parallel-sentences-ccmatrix
3662 downloads
['task_categories:feature-extraction''task_categories:sentence-similarity''language:af'
m-a-p/SuperGPQA
3659 downloads
['task_categories:text2text-generation''language:en''license:odc-by'
garrethlee/comprehensive-arithmetic-problems
3651 downloads
['size_categories:1M<n<10M''format:parquet''modality:text'
lambdalabs/naruto-blip-captions
3640 downloads
['size_categories:1K<n<10K''format:parquet''modality:image'
livebench/language
3633 downloads
['size_categories:n<1K''format:parquet''modality:text'
ChristophSchuhmann/wikipedia-en-nov22-1-sentence-level
3623 downloads
['size_categories:10M<n<100M''format:parquet''modality:text'