Datasets
beomi/KoAlpaca-v1.1a
966 downloads
['task_categories:text-generation''language:ko''size_categories:10K<n<100K'
qmeeus/vp-er-10l
966 downloads
['language:cs''language:de''language:en'
InfoTokenizers/finewebedu-20B
966 downloads
['language:en''size_categories:10M<n<100M''format:parquet'
Mxode/Chinese-Reasoning-Distil-Data
966 downloads
['task_categories:text-generation''language:zh''license:cc-by-sa-4.0'
fineinstructions-pretraining/nemotron_actual_1T
966 downloads
['size_categories:100M<n<1B''format:parquet''modality:text'
taln-ls2n/kpbiomed
965 downloads
['task_categories:text-generation''annotations_creators:unknown''language_creators:unknown'
orgcatorg/multilingual
965 downloads
['size_categories:10M<n<100M''format:parquet''modality:text'
barc0/200k_HEAVY_gpt4o-description-gpt4omini-code_generated_problems
964 downloads
['task_categories:text-generation''language:en''license:mit'
g1g2g3/032
964 downloads
['size_categories:n<1K''format:json''modality:text'
g1g2g3/020
963 downloads
['size_categories:n<1K''format:json''modality:text'