Datasets
chaoscodes/refineweb_pre_500_1
3985 downloads
['license:apache-2.0''size_categories:n<1K''format:json'
hackercupai/hackercup
3983 downloads
['license:apache-2.0''size_categories:n<1K''format:parquet'
pickapic-anonymous/pickapic_v1
3980 downloads
['size_categories:100K<n<1M''format:parquet''modality:tabular'
allenai/lila
3967 downloads
['license:cc-by-4.0''size_categories:100K<n<1M''modality:text'
lmms-lab/EgoIT-99K
3959 downloads
['size_categories:100K<n<1M''format:parquet''modality:audio'
wmt/wmt19
3956 downloads
['task_categories:translation''annotations_creators:no-annotation''language_creators:found'
Supermaxman/esa-hubble
3951 downloads
['task_categories:text-to-image''language:en''license:cc-by-4.0'
garrethlee/comprehensive-arithmetic-problems-carries
3951 downloads
['size_categories:1M<n<10M''format:parquet''modality:text'
capleaf/viVoice
3935 downloads
['task_categories:text-to-speech''language:vi''license:cc-by-nc-sa-4.0'
ServiceNow/repliqa
3927 downloads
['task_categories:question-answering''task_categories:text-classification''annotations_creators:crowdsourced'