Datasets
gmongaras/CC12M_and_Imagenet21K_Recap
1231 downloads
['size_categories:10M<n<100M''format:parquet''modality:image'
hypnopump/unimol_pretrain
1231 downloads
['size_categories:10M<n<100M''format:parquet''modality:text'
danasone/taiga_proza
1220 downloads
['size_categories:1M<n<10M''format:parquet''modality:text'
PromptEval/PromptEval_MMLU_full
1227 downloads
['task_categories:question-answering''language:en''license:mit'
Aleph-Alpha/Aleph-Alpha-GermanWeb
1227 downloads
['license:other''size_categories:1B<n<10B''format:parquet'
hlillemark/c4_t5_pretrain
1225 downloads
['size_categories:100M<n<1B''format:parquet''library:datasets'
icedwind/x_dataset_27136
1222 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:question-answering'
zkpbeats/reddit_ds_734775
1221 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:question-answering'
mlfoundations-dev/evalset_2e29
1221 downloads
['size_categories:10K<n<100K''format:parquet''modality:tabular'
openbmb/RLAIF-V-Dataset
1220 downloads
['task_categories:visual-question-answering''language:en''license:cc-by-nc-4.0'