Datasets
MBZUAI/ArabicMMLU
3423 downloads
['task_categories:question-answering''language:ar''license:cc-by-nc-4.0'
epfml/FineWeb2-HQ
3354 downloads
['task_categories:text-generation''language:ru''language:zh'
bigcode/the-stack-v2-train-smol-ids
3297 downloads
['task_categories:text-generation''language_creators:crowdsourced''language_creators:expert-generated'
ai4bharat/indic_glue
3245 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:multiple-choice'
csaybar/CloudSEN12-nolabel
3237 downloads
['license:cc-by-nc-4.0''size_categories:10K<n<100K''format:csv'
lerobot/aloha_sim_transfer_cube_human
3236 downloads
['task_categories:robotics''license:mit''size_categories:10K<n<100K'
BByrneLab/multi_task_multi_modal_knowledge_retrieval_benchmark_M2KR
3216 downloads
['language:en''license:mit''size_categories:10M<n<100M'
Intelligent-Internet/wikipedia_en
3170 downloads
['task_categories:feature-extraction''language:en''license:apache-2.0'
HuggingFaceTB/dclm-edu
3151 downloads
['language:en''license:cc-by-4.0''size_categories:1B<n<10B'
IPEC-COMMUNITY/taco_play_lerobot
3148 downloads
['task_categories:robotics''license:apache-2.0''size_categories:100K<n<1M'