Datasets
rjac/all-the-news-2-1-Component-one
102598 downloads
['annotations_creators:Andrew Thompson''annotations_creators:components.one''language:en'
stanfordnlp/imdb
94775 downloads
['task_categories:text-classification''task_ids:sentiment-classification''annotations_creators:expert-generated'
tau/commonsense_qa
90301 downloads
['task_categories:question-answering''task_ids:open-domain-qa''annotations_creators:crowdsourced'
wenknow/reddit_dataset_44
83781 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:question-answering'
mlfoundations/MINT-1T-HTML
82205 downloads
['task_categories:image-to-text''task_categories:text-generation''language:en'
adams-story/datacomp200m
81814 downloads
['size_categories:100M<n<1B''format:parquet''modality:image'
wikimedia/wikipedia
79914 downloads
['task_categories:text-generation''task_categories:fill-mask''task_ids:language-modeling'
HuggingFaceM4/the_cauldron
76296 downloads
['size_categories:1M<n<10M''format:parquet''modality:image'
wyu1/Leopard-Instruct
69938 downloads
['language:en''license:apache-2.0''size_categories:1M<n<10M'
gabrielaltay/pubtator-central-bigbio-kb-2022-12-18
68612 downloads
['size_categories:10M<n<100M''format:parquet''modality:text'