Datasets
TwoAbove/the-project-gutenberg-open-audiobook-collection
3391 downloads
['language:en''size_categories:n<1K''format:parquet'
AlignmentResearch/EnronSpam
3390 downloads
['size_categories:10K<n<100K''format:parquet''modality:text'
YWjimmy/PeRFception-v1-1
3370 downloads
['modality:image''region:us']
qinbright99/mllm-eval
3369 downloads
['license:mit''size_categories:100K<n<1M''modality:text'
UCSC-VLAA/MedTrinity-25M
3368 downloads
['task_categories:question-answering''language:en''size_categories:10M<n<100M'
wecover/OPUS_Tatoeba
3364 downloads
['size_categories:1M<n<10M''format:parquet''modality:text'
CohereLabs/Global-MMLU-Lite
3364 downloads
['language:en''language:ar''language:bn'
lesserfield/4chan-datasets
3361 downloads
['task_categories:text-generation''language:en''license:unlicense'
CodedotAI/code_clippy_github
3359 downloads
['task_ids:language-modeling''language_creators:crowdsourced''language_creators:expert-generated'
stanfordnlp/coqa
3358 downloads
['task_categories:question-answering''task_ids:extractive-qa''annotations_creators:crowdsourced'