Datasets
EleutherAI/hendrycks_math
26925 downloads
['license:mit''size_categories:10K<n<100K''format:parquet'
HPLT/HPLT2.0_cleaned
26753 downloads
['task_categories:fill-mask''task_categories:text-generation''task_ids:language-modeling'
roneneldan/TinyStories
26605 downloads
['task_categories:text-generation''language:en''license:cdla-sharing-1.0'
open-r1/OpenR1-Math-220k
26203 downloads
['language:en''license:apache-2.0''size_categories:100K<n<1M'
baber/piqa
25890 downloads
['size_categories:10K<n<100K''format:parquet''modality:text'
MERaLiON/Multitask-National-Speech-Corpus-v1
25607 downloads
['size_categories:10M<n<100M''format:parquet''modality:audio'
rajpurkar/squad_v2
25600 downloads
['task_categories:question-answering''task_ids:open-domain-qa''task_ids:extractive-qa'
FredZhang7/stable-diffusion-prompts-2.47M
25387 downloads
['task_categories:text-generation''language:en''license:creativeml-openrail-m'
SparkAudio/voxbox
25120 downloads
['task_categories:text-to-speech''language:zh''language:en'
asahi417/seamless-align-enA-frA.speaker-embedding.xlsr-2b
25042 downloads
['size_categories:100K<n<1M''format:parquet''modality:tabular'