Datasets
gmongaras/CC12M_and_Imagenet21K_Recap_Highqual
2067 downloads
['size_categories:10M<n<100M''format:parquet''modality:image'
yuwd/Polaris
2063 downloads
['task_categories:image-to-text''language:en''license:bsd'
glaiveai/reasoning-v1-20m
2023 downloads
['task_categories:text-generation''language:en''license:apache-2.0'
limingcv/SuperEdit-40K
2021 downloads
['task_categories:image-to-image''size_categories:10K<n<100K''format:parquet'
papluca/language-identification
2060 downloads
['task_categories:text-classification''task_ids:multi-class-classification''multilinguality:multilingual'
llamaindex/vdr-multilingual-train
2057 downloads
['multilinguality:multilingual''language:de''language:it'
momo1942/x_dataset_44829
2055 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:question-answering'
zeta-alpha-ai/NanoTouche2020
2053 downloads
['task_categories:text-retrieval''task_ids:document-retrieval''multilinguality:monolingual'
picollect/danbooru
2053 downloads
['language:en''license:other''size_categories:10M<n<100M'
recursal/Fanatic-Fandom
2052 downloads
['task_categories:text-generation''task_categories:fill-mask''task_ids:language-modeling'