Datasets
MLP-SEMO/IT_data_old
1419 downloads
['size_categories:100K<n<1M''modality:text''region:us']
HiTZ/casimedicos-exp
1418 downloads
['task_categories:text-generation''task_categories:question-answering''language:en'
sailor2/sea-pdf-text
1417 downloads
['license:odc-by''size_categories:10M<n<100M''format:json'
mteb/medrxiv-clustering-p2p
1416 downloads
['task_categories:text-classification''annotations_creators:derived''multilinguality:monolingual'
ashraq/esc50
1416 downloads
['size_categories:1K<n<10K''format:parquet''modality:audio'
vidore/syntheticDocQA_artificial_intelligence_test
1416 downloads
['task_categories:visual-question-answering''task_categories:question-answering''language:en'
ClementRomac/cleaned_deduplicated_oscar
1415 downloads
['size_categories:100M<n<1B''format:parquet''modality:text'
RMT-team/babilong-1k-samples
1414 downloads
['language:en''size_categories:10K<n<100K''format:parquet'
SimulaMet-HOST/Kvasir-VQA
1413 downloads
['task_categories:visual-question-answering''language:en''license:cc-by-nc-4.0'
Xkev/LLaVA-CoT-100k
1412 downloads
['task_categories:visual-question-answering''language:en''license:apache-2.0'