Datasets
qinjiushao7/qin-jiushao
5777 downloads
['region:us']
lishiqianhugh/globaltomo
90204 downloads
['license:cc-by-nc-sa-4.0''region:us']
cerebras/SlimPajama-627B
84437 downloads
['task_categories:text-generation''language:en''arxiv:2306.01116'
monology/pile-uncopyrighted
84245 downloads
['license:other''size_categories:1M<n<10M''format:json'
bigscience/xP3
83835 downloads
['task_categories:other''annotations_creators:expert-generated''annotations_creators:crowdsourced'
society-ethics/stable-bias-generations
83817 downloads
['modality:image''region:us']
wenknow/reddit_dataset_44
83781 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:question-answering'
T-NOVA/NO_SCORE
83663 downloads
['size_categories:100M<n<1B''format:csv''modality:text'
amphion/Emilia-Dataset
82509 downloads
['task_categories:text-to-speech''task_categories:automatic-speech-recognition''language:zh'
EleutherAI/lambada_openai
82259 downloads
['task_ids:language-modeling''language_creators:machine-generated''multilinguality:translation'