Datasets
teven/github_all_lang_filtered
1130 downloads
['size_categories:10M<n<100M''format:parquet''modality:text'
nielsr/docvqa_1200_examples
1130 downloads
['size_categories:1K<n<10K''format:parquet''modality:image'
sorenmulli/nordjylland-news-summarization-subset
1130 downloads
['size_categories:n<1K''format:parquet''modality:tabular'
flwrlabs/femnist
1129 downloads
['task_categories:image-classification''license:bsd-2-clause''size_categories:100K<n<1M'
Muennighoff/xP3x-sample
1128 downloads
['task_categories:other''annotations_creators:expert-generated''annotations_creators:crowdsourced'
kenhktsui/openwebtext_quality_score_v1
1128 downloads
['task_categories:text-generation''language:en''license:cc0-1.0'
BangumiBase/skipbeat
1126 downloads
['license:mit''size_categories:1K<n<10K''modality:image'
ClusterlabAi/101_billion_arabic_words_dataset
1126 downloads
['task_categories:text-generation''language:ar''license:apache-2.0'
nbettencourt/SC454k-formatted
1126 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
ai4bharat/indic-align
1125 downloads
['task_categories:text-generation''language:as''language:bn'