Datasets
TencentARC/VPData
4670 downloads
['task_categories:image-to-video''task_categories:text-to-video''language:en'
hqfang/SAM2Act
4651 downloads
['license:apache-2.0''size_categories:100K<n<1M''format:webdataset'
benjamin-paine/imagenet-1k
4646 downloads
['task_categories:image-classification''task_ids:multi-class-image-classification''annotations_creators:crowdsourced'
BIOMEDICA/biomedica_webdataset_24M
4636 downloads
['size_categories:n>1T''arxiv:2501.07171''region:us'
katieluo88/MixedSignalsDataset
4634 downloads
['license:odc-by''region:us']
HuggingFaceGECLM/REDDIT_threaded
4633 downloads
['size_categories:10M<n<100M''format:parquet''modality:tabular'
zed-industries/zeta
4624 downloads
['license:apache-2.0''size_categories:n<1K''format:json'
mozilla-foundation/common_voice_15_0
4614 downloads
['task_categories:automatic-speech-recognition''annotations_creators:crowdsourced''language_creators:crowdsourced'
HKUSTAudio/Audio-FLAN-Dataset
4610 downloads
['task_categories:text-to-speech''task_categories:text-to-audio''task_categories:automatic-speech-recognition'
ywchoi/OpenMedText
915 downloads
['language:en''arxiv:2503.09032''region:us'