Datasets
kashif/nectar_dpo_pairs
2360 downloads
['language:en''license:cc-by-nc-4.0''size_categories:1M<n<10M'
Jakh0103/glotlid_processed
2360 downloads
['size_categories:100M<n<1B''format:parquet''modality:text'
BeIR/scifact
2359 downloads
['task_categories:text-retrieval''task_ids:entity-linking-retrieval''task_ids:fact-checking-retrieval'
cyberagent/crello
2359 downloads
['task_categories:unconditional-image-generation''annotations_creators:no-annotation''language_creators:found'
zeta-alpha-ai/NanoSCIDOCS
2358 downloads
['task_categories:text-retrieval''task_ids:document-retrieval''multilinguality:monolingual'
Muennighoff/flan
2357 downloads
['task_categories:other''annotations_creators:crowdsourced''annotations_creators:expert-generated'
alexandrainst/nordjylland-news-summarization
2356 downloads
['task_categories:summarization''language:da''license:cc0-1.0'
hkust-nlp/PreSelect-100B
2352 downloads
['license:mit''size_categories:10M<n<100M''format:json'
jamendolyrics/jam-alt
2350 downloads
['task_categories:automatic-speech-recognition''multilinguality:multilingual''language:en'
ai4privacy/pii-masking-300k
2350 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:table-question-answering'