Datasets
m-a-p/COIG-CQIA
4261 downloads
['task_categories:question-answering''task_categories:text-classification''task_categories:text-generation'
skt/kobest_v1
4158 downloads
['annotations_creators:expert-generated''language_creators:expert-generated''multilinguality:monolingual'
sahil2801/CodeAlpaca-20k
4139 downloads
['task_categories:text-generation''language:en''license:cc-by-4.0'
RMT-team/babilong
4059 downloads
['language:en''size_categories:10K<n<100K''format:json'
allenai/real-toxicity-prompts
4057 downloads
['multilinguality:monolingual''source_datasets:original''language:en'
olm/gdelt-news-headlines
3990 downloads
['size_categories:10M<n<100M''format:json''modality:text'
chaoscodes/refineweb_pre_500_1
3985 downloads
['license:apache-2.0''size_categories:n<1K''format:json'
sggetao/PwC
3923 downloads
['license:apache-2.0''size_categories:100K<n<1M''format:json'
Salesforce/xlam-function-calling-60k
3886 downloads
['task_categories:question-answering''task_categories:text-generation''task_categories:reinforcement-learning'
laion/OIG
3873 downloads
['license:apache-2.0''size_categories:10M<n<100M''format:json'