Datasets
iohadrubin/codeparrot-train-v2-near-dedup-safe
1014 downloads
['size_categories:1M<n<10M''format:parquet''modality:tabular'
CG-Bench/CG-Bench
1012 downloads
['task_categories:visual-question-answering''language:en''license:mit'
gneubig/aime-1983-2024
1012 downloads
['task_categories:text-classification''language:en''license:cc0-1.0'
google/MusicCaps
1005 downloads
['task_categories:text-to-speech''language:en''license:cc-by-sa-4.0'
nyu-dice-lab/wavepulse-radio-raw-transcripts
1005 downloads
['task_categories:text-generation''task_categories:text-classification''task_ids:news-articles-summarization'
RioYokotaLab/fineweb-edu
1005 downloads
['size_categories:100M<n<1B''format:json''modality:tabular'
asahi417/seamless-align-enA-jaA.speaker-embedding.hubert-xl
999 downloads
['size_categories:100K<n<1M''format:parquet''modality:tabular'
latam-gpt/red_pajama_es_hq
994 downloads
['language:es''size_categories:100M<n<1B''format:parquet'
Magpie-Align/Llama-3-Magpie-Pro-1M-v0.1
992 downloads
['language:en''license:llama3''size_categories:1M<n<10M'
tdavidson/hate_speech_offensive
989 downloads
['task_categories:text-classification''annotations_creators:expert-generated''annotations_creators:crowdsourced'