Datasets
HuggingFaceGECLM/REDDIT_comments
16505 downloads
['task_categories:text-generation''task_ids:dialogue-modeling''task_ids:language-modeling'
lmms-lab/GQA
16475 downloads
['license:mit''size_categories:10M<n<100M''format:parquet'
nuprl/MultiPL-E
16360 downloads
['annotations_creators:machine-generated''language_creators:machine-generated''language_creators:expert-generated'
MathLLMs/MathVision
16344 downloads
['task_categories:question-answering''task_categories:multiple-choice''task_categories:visual-question-answering'
ylacombe/cml-tts
16256 downloads
['task_categories:text-to-speech''task_categories:text-to-audio''language:nl'
SwayStar123/preprocessed_commoncatalog-cc-by
15395 downloads
['language:en''license:cc-by-4.0''size_categories:10M<n<100M'
cais/wmdp
14970 downloads
['task_categories:text-generation''language:en''license:mit'
HuggingFaceTB/smol-smoltalk
14892 downloads
['language:en''license:apache-2.0''size_categories:100K<n<1M'
uonlp/CulturaX
14348 downloads
['task_categories:text-generation''task_categories:fill-mask''task_ids:language-modeling'
Helsinki-NLP/europarl
14336 downloads
['task_categories:translation''annotations_creators:found''language_creators:found'