Datasets
tensorshield/reddit_dataset_30
2271 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:question-answering'
hf-internal-testing/fill10
2270 downloads
['size_categories:n<1K''format:parquet''modality:image'
bigdata-pw/Flickr
2270 downloads
['task_categories:image-classification''task_categories:image-to-text''task_categories:text-to-image'
corto-ai/nsw-caselaw-qa-embed
2270 downloads
['size_categories:10M<n<100M''format:parquet''modality:text'
nvidia/Aegis-AI-Content-Safety-Dataset-2.0
2268 downloads
['task_categories:text-classification''language:en''license:cc-by-4.0'
BEE-spoke-data/reddit-title-body-hf
2265 downloads
['task_categories:text-generation''task_categories:text2text-generation''license:odc-by'
bofenghuang/stt-pseudo-labeled-whisper-large-v3-multilingual
2263 downloads
['license:cc-by-3.0''region:us']
cfahlgren1/hub-stats
2261 downloads
['license:apache-2.0''size_categories:1M<n<10M''format:parquet'
vidore/colpali_train_set
2260 downloads
['size_categories:100K<n<1M''format:parquet''modality:image'
VLR-CVC/ComicsPAP
2259 downloads
['language:en''license:cc-by-sa-4.0''size_categories:10K<n<100K'