Datasets
wmt/wmt16
6331 downloads
['task_categories:translation''annotations_creators:no-annotation''language_creators:found'
ucla-contextual/contextual_test
6327 downloads
['size_categories:n<1K''format:csv''modality:image'
fixie-ai/gigaspeech
6314 downloads
['size_categories:10M<n<100M''format:parquet''modality:audio'
HuggingFaceM4/WebSight
6276 downloads
['language:en''license:cc-by-4.0''size_categories:1M<n<10M'
hanhainebula/bge-multilingual-gemma2-data
6251 downloads
['multilinguality:multilingual''size_categories:1M<n<10M''format:json'
bigcode/starcoderdata
6250 downloads
['task_categories:text-generation''language_creators:crowdsourced''language_creators:expert-generated'
pourmand1376/isna-news
6246 downloads
['task_categories:text-generation''language:fa''license:apache-2.0'
fancyzhx/amazon_polarity
6240 downloads
['task_categories:text-classification''task_ids:sentiment-classification''annotations_creators:crowdsourced'
lmms-lab/NExTQA
6194 downloads
['size_categories:10K<n<100K''format:parquet''modality:tabular'
Open-Orca/FLAN
6183 downloads
['language:en''license:cc-by-4.0''size_categories:100M<n<1B'