Datasets
corto-ai/nsw-caselaw-qa-embed
2270 downloads
['size_categories:10M<n<100M''format:parquet''modality:text'
BEE-spoke-data/reddit-title-body-hf
2265 downloads
['task_categories:text-generation''task_categories:text2text-generation''license:odc-by'
cfahlgren1/hub-stats
2261 downloads
['license:apache-2.0''size_categories:1M<n<10M''format:parquet'
vidore/colpali_train_set
2260 downloads
['size_categories:100K<n<1M''format:parquet''modality:image'
VLR-CVC/ComicsPAP
2259 downloads
['language:en''license:cc-by-sa-4.0''size_categories:10K<n<100K'
yimingzhang/novelty-bench
2254 downloads
['size_categories:1K<n<10K''format:parquet''modality:text'
Helsinki-NLP/multiun
2247 downloads
['task_categories:translation''annotations_creators:found''language_creators:found'
jppgks/twitter-financial-news-sentiment
2243 downloads
['license:mit''size_categories:10K<n<100K''format:parquet'
zicsx/mC4-Hindi-Cleaned-3.0
2241 downloads
['language:hi''size_categories:1M<n<10M''format:parquet'
ds4sd/PubTables-1M_OTSL
2237 downloads
['task_categories:object-detection''task_categories:table-to-text''license:other'