Datasets
nvidia/Llama-Nemotron-Post-Training-Dataset
12177 downloads
['license:cc-by-4.0''size_categories:1M<n<10M''format:json'
FreedomIntelligence/medical-o1-reasoning-SFT
11823 downloads
['task_categories:question-answering''task_categories:text-generation''language:en'
mii-llm/results
10884 downloads
['license:apache-2.0''size_categories:n<1K''format:json'
Avelina/smollm-corpus-cleaned
10162 downloads
['task_categories:text-generation''language:en''license:odc-by'
facebook/belebele
9849 downloads
['task_categories:question-answering''task_categories:zero-shot-classification''task_categories:text-classification'
stingning/ultrachat
9619 downloads
['task_categories:text-generation''language:en''license:mit'
IPEC-COMMUNITY/OpenFly
9278 downloads
['size_categories:100K<n<1M''format:json''modality:text'
PortPy-Project/PortPy_Dataset
8967 downloads
['language:en''license:cc-by-nc-4.0''size_categories:n<1K'
llamafactory/alpaca_gpt4_zh
8511 downloads
['task_categories:text-generation''task_categories:question-answering''language:zh'
tokyotech-llm/swallow-code
7999 downloads
['task_categories:text-generation''language:en''language:ja'