Datasets
distil-whisper/librispeech_long
6525 downloads
['size_categories:n<1K''format:parquet''modality:audio'
nlile/NuminaMath-1.5-RL-Verifiable
6520 downloads
['task_categories:text-generation''task_categories:question-answering''language:en'
speechbrain/LoquaciousSet
6505 downloads
['task_categories:automatic-speech-recognition''annotations_creators:crowdsourced''annotations_creators:machine-generated'
lmms-lab/SEED-Bench
6443 downloads
['size_categories:10K<n<100K''format:parquet''modality:image'
HuggingFaceTB/smoltalk
6442 downloads
['language:en''size_categories:1M<n<10M''format:parquet'
applied-ai-018/pretraining_v1-omega_books
6379 downloads
['size_categories:100M<n<1B''format:parquet''modality:tabular'
vicgalle/alpaca-gpt4
6365 downloads
['task_categories:text-generation''task_categories:question-answering''language:en'
chengjunyan1/smollm-12.5-corpus
6359 downloads
['size_categories:100M<n<1B''format:parquet''modality:tabular'
wmt/wmt16
6331 downloads
['task_categories:translation''annotations_creators:no-annotation''language_creators:found'
fixie-ai/gigaspeech
6314 downloads
['size_categories:10M<n<100M''format:parquet''modality:audio'