Datasets
tanganke/stl10
4147 downloads
['size_categories:10K<n<100K''format:parquet''modality:image'
gretelai/synthetic_text_to_sql
4133 downloads
['task_categories:question-answering''task_categories:table-question-answering''task_categories:text-generation'
regent-research/regent-subset-of-jat-dataset-tokenized
4130 downloads
['size_categories:10M<n<100M''format:parquet''modality:timeseries'
dariakern/Chicks4FreeID
4110 downloads
['language:en''license:cc-by-4.0''size_categories:1K<n<10K'
AlignmentResearch/PasswordMatch
4061 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
openlanguagedata/flores_plus
4104 downloads
['task_categories:text2text-generation''task_categories:translation''annotations_creators:found'
toxigen/toxigen-data
4102 downloads
['task_categories:text-classification''task_ids:hate-speech-detection''annotations_creators:expert-generated'
philipp-zettl/mtg_cards-2025-04-04
4091 downloads
['task_categories:sentence-similarity''language:en''size_categories:1M<n<10M'
MykMaks/nordjylland-news-image-captioning
4076 downloads
['task_categories:zero-shot-classification''language:da''size_categories:10K<n<100K'
gpt-omni/VoiceAssistant-400K
4072 downloads
['license:apache-2.0''size_categories:100K<n<1M''format:parquet'