Datasets
LLM4SCIENCE/uparxive_boxed_pdf
6045 downloads
['task_categories:image-to-text''language:en''license:mit'
cfilt/IITB-IndicMonoDoc
6141 downloads
['task_categories:text-generation''language:hi''language:mr'
juletxara/xstory_cloze
6139 downloads
['task_categories:other''annotations_creators:found''language_creators:found'
timaeus/pile-arxiv
6139 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
Kaichengalex/RealSyn100M
6137 downloads
['license:mit''size_categories:10M<n<100M''format:parquet'
proj-persona/PersonaHub
6136 downloads
['task_categories:text-generation''task_categories:text-classification''task_categories:token-classification'
McGill-NLP/WebLINX-full
6133 downloads
['language:en''size_categories:10K<n<100K''arxiv:2402.05930'
javiercanillejas/canillejas
6130 downloads
['region:us']
nvidia/ClimbMix
6096 downloads
['task_categories:text-generation''language:en''license:cc-by-nc-4.0'
valhalla/images
6091 downloads
['size_categories:n<1K''format:imagefolder''modality:image'