Datasets
zed-industries/zeta
4624 downloads
['license:apache-2.0''size_categories:n<1K''format:json'
google/wmt24pp
4534 downloads
['task_categories:translation''language:ar''language:bg'
m-a-p/MAP-CC
4467 downloads
['license:cc-by-nc-nd-4.0''size_categories:1B<n<10B''format:json'
Weyaxi/sci-datasets
4385 downloads
['license:other''size_categories:100K<n<1M''format:json'
PKU-Alignment/BeaverTails
4380 downloads
['task_categories:text-classification''language:en''license:cc-by-nc-4.0'
m-a-p/PIN-14M
4379 downloads
['language:en''language:zh''license:apache-2.0'
common-pile/comma_v0.1_training_dataset
4313 downloads
['size_categories:1B<n<10B''format:json''modality:text'
chonkie-ai/recipes
4165 downloads
['license:apache-2.0''size_categories:n<1K''format:json'
mteb/amazon_massive_scenario
4281 downloads
['task_categories:text-classification''annotations_creators:human-annotated''multilinguality:translated'
teknium/OpenHermes-2.5
4278 downloads
['language:eng''size_categories:1M<n<10M''format:json'