Datasets
oier-mees/BiPlay
3067 downloads
['task_categories:robotics''license:mit''arxiv:2410.10088'
rte-france/RTE7000
3064 downloads
['license:cc-by-sa-4.0''size_categories:n<1K''format:text'
meihualuomanxueshan/Processed_Hypersim
3062 downloads
['license:other''region:us']
rootsautomation/ScreenSpot
3061 downloads
['task_categories:text-generation''task_categories:image-to-text''language:en'
deepghs/game_character_skins
3056 downloads
['size_categories:1K<n<10K''format:imagefolder''modality:image'
cfli/pretrain_wiki
3056 downloads
['size_categories:10M<n<100M''format:parquet''modality:text'
miracl/miracl-corpus
3053 downloads
['task_categories:text-retrieval''task_ids:document-retrieval''annotations_creators:expert-generated'
apollo-research/Skylion007-openwebtext-tokenizer-gpt2
3053 downloads
['size_categories:1M<n<10M''format:parquet''library:datasets'
hammh0a/SynthCLIP
713 downloads
['license:cc-by-nc-4.0''arxiv:2402.01832''region:us']
zeta-alpha-ai/NanoMSMARCO
3040 downloads
['task_categories:text-retrieval''task_ids:document-retrieval''multilinguality:monolingual'