Datasets
ryoungj/bootstrap-latent-thought-data
2929 downloads
['task_categories:text-generation''license:apache-2.0''size_categories:10M<n<100M'
bigcode/the-stack-v2
2916 downloads
['task_categories:text-generation''language_creators:crowdsourced''language_creators:expert-generated'
hiyouga/math12k
2910 downloads
['task_categories:question-answering''language:en''license:mit'
makaveli10/whisper-hindi-preprocessed
2909 downloads
['size_categories:1K<n<10K''format:parquet''library:datasets'
BEE-spoke-data/code_contests_instruct
2908 downloads
['task_categories:text-generation''source_datasets:teven/code_contests''source_datasets:deepmind/code_contests'
starriver030515/FUSION-Pretrain-10M
2900 downloads
['task_categories:question-answering''task_categories:visual-question-answering''task_categories:table-question-answering'
joujiboi/japanese-anime-speech
2897 downloads
['task_categories:automatic-speech-recognition''language:ja''license:cc0-1.0'
Salesforce/cota-mantis
2894 downloads
['license:cc-by-nc-4.0''size_categories:1M<n<10M''format:parquet'
cardiffnlp/databench
2890 downloads
['task_categories:table-question-answering''task_categories:question-answering''language:en'
simplescaling/s1K-1.1
2890 downloads
['language:en''license:mit''size_categories:1K<n<10K'