Datasets
scikit-learn/iris
6372 downloads
['license:cc0-1.0''size_categories:n<1K''format:csv'
vicgalle/alpaca-gpt4
6365 downloads
['task_categories:text-generation''task_categories:question-answering''language:en'
chengjunyan1/smollm-12.5-corpus
6359 downloads
['size_categories:100M<n<1B''format:parquet''modality:tabular'
mlfoundations/dclm-pool-1b-5x
6356 downloads
['license:cc-by-4.0''region:us']
universal-dependencies/universal_dependencies
6343 downloads
['task_categories:token-classification''task_ids:parsing''annotations_creators:expert-generated'
wmt/wmt16
6331 downloads
['task_categories:translation''annotations_creators:no-annotation''language_creators:found'
ucla-contextual/contextual_test
6327 downloads
['size_categories:n<1K''format:csv''modality:image'
Airtel4141/Sssdmdsff
6326 downloads
['task_categories:text-classification''language:aa''license:apache-2.0'
hr16/kinh-phap-hoa-ke-trom-huong
6323 downloads
['task_categories:text-to-audio''task_categories:text-to-speech''task_categories:automatic-speech-recognition'
fixie-ai/gigaspeech
6314 downloads
['size_categories:10M<n<100M''format:parquet''modality:audio'