Datasets
AlignmentResearch/EnronSpam
3390 downloads
['size_categories:10K<n<100K''format:parquet''modality:text'
UCSC-VLAA/MedTrinity-25M
3368 downloads
['task_categories:question-answering''language:en''size_categories:10M<n<100M'
wecover/OPUS_Tatoeba
3364 downloads
['size_categories:1M<n<10M''format:parquet''modality:text'
CohereLabs/Global-MMLU-Lite
3364 downloads
['language:en''language:ar''language:bn'
stanfordnlp/coqa
3358 downloads
['task_categories:question-answering''task_ids:extractive-qa''annotations_creators:crowdsourced'
epfml/FineWeb2-HQ
3354 downloads
['task_categories:text-generation''language:ru''language:zh'
zechen-nlp/MNLP_STEM_mcqa_demo
3351 downloads
['size_categories:n<1K''format:parquet''modality:text'
Hyper-AI-Computer/KeystoneFuse-Train-Data-Pretrain-V3
3332 downloads
['size_categories:1M<n<10M''format:parquet''modality:text'
StormKing99/x_dataset_8191
3322 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:question-answering'
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
3318 downloads
['size_categories:100K<n<1M''format:parquet''library:datasets'