Datasets
philschmid/guanaco-sharegpt-style
2323 downloads
['size_categories:1K<n<10K''format:parquet''modality:text'
epfml/FineWeb2-embedded
2323 downloads
['task_categories:text-generation''language:ru''language:zh'
sentence-transformers/s2orc
2319 downloads
['task_categories:feature-extraction''task_categories:sentence-similarity''multilinguality:monolingual'
laion/relaion2B-en-research-safe
2316 downloads
['size_categories:1B<n<10B''format:parquet''modality:image'
Babelscape/wikineural
2314 downloads
['task_categories:token-classification''task_ids:named-entity-recognition''annotations_creators:machine-generated'
Kevin355/Who_and_When
2310 downloads
['size_categories:n<1K''format:parquet''modality:text'
hazyresearch/based-squad
2308 downloads
['size_categories:1K<n<10K''format:parquet''modality:text'
snoop2head/enron_aeslc_emails
2300 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
claran/modular-s2orc-parquet
2293 downloads
['license:odc-by''size_categories:1M<n<10M''format:parquet'
Linear-Next/Linear-Next-Datasets
2290 downloads
['size_categories:100M<n<1B''format:parquet''modality:text'