Datasets
EleutherAI/fineweb-edu-dedup-10b
1439 downloads
['size_categories:1M<n<10M''format:parquet''modality:text'
Charlie911/tmmluplus_CKIP_segmented
1435 downloads
['size_categories:10K<n<100K''format:parquet''modality:text'
cc-clean/CC-MAIN-2017-22
1433 downloads
['size_categories:100M<n<1B''format:parquet''modality:text'
swj0419/WikiMIA
1432 downloads
['language:en''license:mit''size_categories:1K<n<10K'
M-A-D/Mixed-Arabic-Datasets-Repo
1430 downloads
['task_categories:text-classification''task_categories:question-answering''task_categories:translation'
CausalNLP/gpt2small_full_training_data
1430 downloads
['size_categories:1M<n<10M''format:parquet''modality:text'
MakiPan/Hagrid-mediapipe-hand-enc
1426 downloads
['size_categories:100K<n<1M''format:parquet''modality:image'
robert-1111/x_dataset_041134
1426 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:question-answering'
louisbrulenaudet/bofip
1419 downloads
['task_categories:text-generation''task_categories:table-question-answering''task_categories:summarization'
ashraq/esc50
1416 downloads
['size_categories:1K<n<10K''format:parquet''modality:audio'