Datasets
TempestTeam/dataset-the-stack-v2-dedup-sub
1900 downloads
['task_categories:text-generation''license:other''size_categories:10M<n<100M'
nyan102/kagglemodel
1898 downloads
['size_categories:n<1K''format:text''modality:text'
parsee-mizuhashi/phony
1896 downloads
['license:mit''modality:image''modality:text'
openai/mrcr
1896 downloads
['license:mit''size_categories:1K<n<10K''format:parquet'
nomic-ai/cornstack-java-v1
1893 downloads
['license:apache-2.0''size_categories:10M<n<100M''format:json'
BeIR/dbpedia-entity
1886 downloads
['task_categories:text-retrieval''task_ids:entity-linking-retrieval''task_ids:fact-checking-retrieval'
timpal0l/scandisent
1886 downloads
['task_categories:text-classification''language:sv''language:no'
keivalya/MedQuad-MedicalQnADataset
1885 downloads
['task_categories:question-answering''task_categories:text2text-generation''size_categories:10K<n<100K'
argilla/distilabel-capybara-dpo-7k-binarized
1884 downloads
['task_categories:question-answering''task_categories:text-generation''language:en'
wecover/OPUS_Europarl
1883 downloads
['size_categories:10M<n<100M''format:parquet''modality:text'