Datasets
dylanebert/3dgs
3449 downloads
['size_categories:n<1K''format:json''modality:3d'
clip-benchmark/wds_mscoco_captions
3436 downloads
['size_categories:10K<n<100K''format:webdataset''modality:image'
PaDaS-Lab/webfaq-retrieval
3435 downloads
['task_categories:text-retrieval''task_ids:document-retrieval''multilinguality:multilingual'
DataRobot-Research/crag
3435 downloads
['task_categories:question-answering''language:en''license:apache-2.0'
gaia-benchmark/results_public
3297 downloads
['size_categories:n<1K''format:parquet''modality:tabular'
mteb/sib200
3429 downloads
['task_categories:text-classification''annotations_creators:expert-annotated''language_creators:expert-generated'
MBZUAI/ArabicMMLU
3423 downloads
['task_categories:question-answering''language:ar''license:cc-by-nc-4.0'
aiwithvarun7/theekkathir-text-dataset
3396 downloads
['task_categories:text-generation''language:ta''license:cc-by-nc-4.0'
TwoAbove/the-project-gutenberg-open-audiobook-collection
3391 downloads
['language:en''size_categories:n<1K''format:parquet'
AlignmentResearch/EnronSpam
3390 downloads
['size_categories:10K<n<100K''format:parquet''modality:text'