Datasets
PleIAs/common_corpus
194840 downloads
['size_categories:100M<n<1B''format:parquet''modality:tabular'
CohereLabs/xP3x
185257 downloads
['task_categories:other''annotations_creators:expert-generated''annotations_creators:crowdsourced'
argilla/databricks-dolly-15k-curated-en
164698 downloads
['language:en''size_categories:10K<n<100K''format:parquet'
Salesforce/blip3-kale
159554 downloads
['task_categories:image-to-text''language:en''license:apache-2.0'
jat-project/jat-dataset
149774 downloads
['task_categories:reinforcement-learning''task_categories:text-generation''task_categories:question-answering'
cais/mmlu
139682 downloads
['task_categories:question-answering''task_ids:multiple-choice-qa''annotations_creators:no-annotation'
HuggingFaceFW/fineweb-edu
132752 downloads
['task_categories:text-generation''language:en''license:odc-by'
aps/super_glue
131358 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:question-answering'
allenai/openbookqa
128085 downloads
['task_categories:question-answering''task_ids:open-domain-qa''annotations_creators:crowdsourced'
andstor/methods2test_small
113962 downloads
['task_categories:text-generation''language:en''license:mit'