Datasets
zicsx/mC4-Hindi-Cleaned-3.0
2241 downloads
['language:hi''size_categories:1M<n<10M''format:parquet'
BeIR/nfcorpus
2239 downloads
['task_categories:text-retrieval''task_ids:entity-linking-retrieval''task_ids:fact-checking-retrieval'
ds4sd/PubTables-1M_OTSL
2237 downloads
['task_categories:object-detection''task_categories:table-to-text''license:other'
ll4ma-lab/grasp-dataset
2236 downloads
['size_categories:10M<n<100M''format:parquet''modality:text'
rainbowbridge/x_dataset_41613
2236 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:question-answering'
multi-train/emb-reddit-title-body
2234 downloads
['size_categories:100M<n<1B''format:parquet''modality:text'
mozilla-foundation/common_voice_16_0
2234 downloads
['annotations_creators:crowdsourced''language_creators:crowdsourced''multilinguality:multilingual'
tattabio/OMG
2234 downloads
['license:cc-by-sa-4.0''size_categories:100M<n<1B''format:parquet'
etechgrid/music-validation-dataset
2234 downloads
['size_categories:1K<n<10K''format:parquet''modality:audio'
cl-nagoya/ruri-dataset-reranker
2231 downloads
['task_categories:question-answering''language:ja''license:other'