Datasets
bigcode/the-stack-dedup
4829 downloads
['task_categories:text-generation''language_creators:crowdsourced''language_creators:expert-generated'
FiscalNote/billsum
4816 downloads
['task_categories:summarization''annotations_creators:found''language_creators:found'
AI-Lab-Makerere/beans
4814 downloads
['task_categories:image-classification''task_ids:multi-class-image-classification''annotations_creators:expert-generated'
japanese-asr/whisper_transcriptions.mls.wer_10.0
4785 downloads
['size_categories:1M<n<10M''format:parquet''modality:audio'
Salesforce/fineweb_deduplicated
4780 downloads
['license:odc-by''size_categories:1B<n<10B''format:parquet'
CSU-JPG/TextAtlas5M
4737 downloads
['task_categories:text-to-image''language:en''license:mit'
benjamin-paine/imagenet-1k
4646 downloads
['task_categories:image-classification''task_ids:multi-class-image-classification''annotations_creators:crowdsourced'
HuggingFaceGECLM/REDDIT_threaded
4633 downloads
['size_categories:10M<n<100M''format:parquet''modality:tabular'
naver-clova-ix/cord-v2
4604 downloads
['license:cc-by-4.0''size_categories:1K<n<10K''format:parquet'
ai4bharat/IndicVoices
4581 downloads
['license:cc-by-4.0''size_categories:1M<n<10M''format:parquet'