Datasets
bigdata-pw/BIGstockimage35M
7454 downloads
['task_categories:text-to-image''task_categories:image-to-text''language:en'
pixparse/cc3m-wds
5803 downloads
['task_categories:image-to-text''license:other''size_categories:1M<n<10M'
farsi-asr/ganjoor-dataset
5774 downloads
['size_categories:10K<n<100K''format:webdataset''modality:audio'
ZuluVision/RaCig-Data
5236 downloads
['size_categories:10M<n<100M''format:webdataset''modality:text'
mlfoundations/MINT-1T-ArXiv
5230 downloads
['task_categories:image-to-text''task_categories:text-generation''language:en'
litagin/reazon-speech-v2-clone
5078 downloads
['task_categories:automatic-speech-recognition''language:ja''license:other'
MAmmoTH-VL/MAmmoTH-VL-Instruct-12M
4763 downloads
['task_categories:visual-question-answering''task_categories:question-answering''language:en'
hqfang/SAM2Act
4651 downloads
['license:apache-2.0''size_categories:100K<n<1M''format:webdataset'
xingjunm/WildDeepfake
4357 downloads
['license:apache-2.0''size_categories:1M<n<10M''format:webdataset'
timm/imagenet-22k-wds
4356 downloads
['task_categories:image-classification''license:other''size_categories:100K<n<1M'