Datasets
clip-benchmark/wds_mscoco_captions
3436 downloads
['size_categories:10K<n<100K''format:webdataset''modality:image'
mitermix/audiosnippets_small_with_detailed_annotation
3266 downloads
['size_categories:100K<n<1M''format:webdataset''modality:audio'
LLMDH/marianne_pdf_10
2814 downloads
['size_categories:100K<n<1M''format:webdataset''modality:text'
pixparse/idl-wds
2768 downloads
['task_categories:image-to-text''license:other''size_categories:1M<n<10M'
apple/DataCompDR-12M
2709 downloads
['task_categories:text-to-image''task_categories:image-to-text''language:en'
TTS-AGI/emilia-yodas
2600 downloads
['task_categories:text-to-speech''task_categories:automatic-speech-recognition''language:en'
sayakpaul/pickapic_v2_webdataset
2452 downloads
['size_categories:1K<n<10K''format:webdataset''modality:image'
Enxin/Football
2401 downloads
['size_categories:10M<n<100M''format:webdataset''modality:image'
LLMDH/marianne_pdf_3
2347 downloads
['size_categories:100K<n<1M''format:webdataset''modality:text'
nyuuzyou/pxhere
2145 downloads
['task_categories:image-classification''task_categories:image-to-text''task_categories:text-to-image'