Datasets
vidore/syntheticDocQA_artificial_intelligence_test
1416 downloads
['task_categories:visual-question-answering''task_categories:question-answering''language:en'
ClementRomac/cleaned_deduplicated_oscar
1415 downloads
['size_categories:100M<n<1B''format:parquet''modality:text'
RMT-team/babilong-1k-samples
1414 downloads
['language:en''size_categories:10K<n<100K''format:parquet'
SimulaMet-HOST/Kvasir-VQA
1413 downloads
['task_categories:visual-question-answering''language:en''license:cc-by-nc-4.0'
Skywork/Skywork-OR1-RL-Data
1411 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
ShoukanLabs/OpenNiji-Dataset-Aesthetic-Finetune-0-15K
1408 downloads
['size_categories:10K<n<100K''format:parquet''modality:image'
MongoDB/tech-news-embeddings
1405 downloads
['task_categories:question-answering''task_categories:text-generation''language:en'
vidore/docvqa_test_subsampled
1403 downloads
['task_categories:question-answering''task_categories:visual-question-answering''language:en'
lmms-lab/VideoMMMU
1400 downloads
['size_categories:n<1K''format:parquet''modality:image'
allenai/WildChat
1399 downloads
['task_categories:text-generation''task_categories:question-answering''task_categories:text2text-generation'