Datasets
mlfoundations/datacomp_1b
3129 downloads
['license:cc-by-4.0''size_categories:1B<n<10B''format:parquet'
wissamantoun/fineweb-edu-format-topic
3119 downloads
['task_categories:text-generation''language:en''license:odc-by'
common-canvas/commoncatalog-cc-by
3109 downloads
['task_categories:text-to-image''language:en''license:cc-by-4.0'
songlab/TraitGym
3099 downloads
['license:mit''size_categories:10M<n<100M''format:parquet'
google-research-datasets/paws
3098 downloads
['task_categories:text-classification''task_ids:semantic-similarity-classification''task_ids:semantic-similarity-scoring'
microsoft/wiki_qa
3094 downloads
['task_categories:question-answering''task_ids:open-domain-qa''annotations_creators:crowdsourced'
Intel/SocialCounterfactuals
3091 downloads
['license:mit''size_categories:100K<n<1M''format:parquet'
argilla/ultrafeedback-binarized-preferences
3087 downloads
['size_categories:10K<n<100K''format:parquet''modality:tabular'
Dahoas/rm-static
3083 downloads
['size_categories:10K<n<100K''format:parquet''modality:text'
ARTPARK-IISc/Vaani-transcription-part
3081 downloads
['task_categories:automatic-speech-recognition''language:hi''language:kn'