Datasets

turing-motors/CoVLA-Dataset

2348 downloads

['language:en''size_categories:10K<n<100K''modality:text'

LLMDH/marianne_pdf_3

2347 downloads

['size_categories:100K<n<1M''format:webdataset''modality:text'

zeta-alpha-ai/NanoNQ

2342 downloads

['task_categories:text-retrieval''task_ids:document-retrieval''multilinguality:monolingual'

PrimeIntellect/INTELLECT-2-RL-Dataset

2332 downloads

['license:apache-2.0''size_categories:100K<n<1M''format:parquet'

MeissonFlow/park

2283 downloads

['license:apache-2.0''size_categories:1M<n<10M''format:parquet'

ai4bharat/samanantar

2330 downloads

['task_categories:text-generation''task_categories:translation''annotations_creators:no-annotation'

princeton-nlp/QuRatedPajama-260B

2330 downloads

['size_categories:100M<n<1B''format:parquet''modality:tabular'

cc-clean/CC-MAIN-2017-39

2329 downloads

['size_categories:100M<n<1B''format:parquet''modality:text'

philschmid/guanaco-sharegpt-style

2323 downloads

['size_categories:1K<n<10K''format:parquet''modality:text'

epfml/FineWeb2-embedded

2323 downloads

['task_categories:text-generation''language:ru''language:zh'
Previous

Page 109 of 1635

Next