Datasets
instruction-pretrain/ft-instruction-synthesizer-collection
2395 downloads
['task_categories:text-classification''task_categories:table-question-answering''task_categories:question-answering'
Muennighoff/flan
2357 downloads
['task_categories:other''annotations_creators:crowdsourced''annotations_creators:expert-generated'
hkust-nlp/PreSelect-100B
2352 downloads
['license:mit''size_categories:10M<n<100M''format:json'
ai4privacy/pii-masking-300k
2350 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:table-question-answering'
FreedomIntelligence/PubMedVision
2321 downloads
['task_categories:question-answering''task_categories:text-generation''language:en'
NousResearch/hermes-function-calling-v1
2317 downloads
['task_categories:text-generation''task_categories:question-answering''task_categories:feature-extraction'
mteb/scidocs
2312 downloads
['task_categories:text-retrieval''multilinguality:monolingual''language:eng'
sailor2/sailor2-pretrain-data-stage1
2300 downloads
['license:odc-by''size_categories:100M<n<1B''format:json'
mteb/medrxiv-clustering-s2s
2277 downloads
['task_categories:text-classification''annotations_creators:derived''multilinguality:monolingual'
kanhatakeyama/wizardlm8x22b-logical-math-coding-sft
2272 downloads
['license:apache-2.0''size_categories:100K<n<1M''format:json'