Datasets
snoop2head/enron_aeslc_emails
2300 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
sailor2/sailor2-pretrain-data-stage1
2300 downloads
['license:odc-by''size_categories:100M<n<1B''format:json'
claran/modular-s2orc-parquet
2293 downloads
['license:odc-by''size_categories:1M<n<10M''format:parquet'
mshah1/speech_robust_bench
2291 downloads
['size_categories:1M<n<10M''modality:audio''modality:text'
Linear-Next/Linear-Next-Datasets
2290 downloads
['size_categories:100M<n<1B''format:parquet''modality:text'
mahdibaghbanzadeh/parent
2283 downloads
['size_categories:10M<n<100M''format:text''modality:text'
NiniCat/MMLU-SR
2281 downloads
['task_categories:question-answering''task_ids:multiple-choice-qa''annotations_creators:expert-generated'
google/xquad
2279 downloads
['task_categories:question-answering''task_ids:extractive-qa''annotations_creators:expert-generated'
AI4Math/MathVerse
2279 downloads
['task_categories:multiple-choice''task_categories:question-answering''task_categories:visual-question-answering'
xcodemind/webcode2m
2279 downloads
['task_categories:image-to-text''license:cc-by-4.0''size_categories:1M<n<10M'