Datasets
tensorshield/reddit_dataset_217
582 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:question-answering'
aisi-whitebox/zhou_et_al_factual_statements
582 downloads
['size_categories:n<1K''format:parquet''modality:text'
datablations/c4-filter
581 downloads
['size_categories:100M<n<1B''format:parquet''modality:tabular'
TimKoornstra/financial-tweets-sentiment
581 downloads
['task_categories:text-classification''language:en''license:mit'
maywell/korean_textbooks
581 downloads
['language:ko''license:apache-2.0''size_categories:1M<n<10M'
codeparrot/codeparrot-train-more-filtering
580 downloads
['size_categories:1M<n<10M''format:parquet''modality:tabular'
CoIR-Retrieval/CodeSearchNet-ccr-go-queries-corpus
580 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
japanese-asr/whisper_transcriptions.reazon_speech_all.wer_10.0
580 downloads
['size_categories:1M<n<10M''format:parquet''modality:audio'
SaylorTwift/the_pile_books3_minus_gutenberg
579 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
saitsharipov/CelebA-HQ
579 downloads
['license:unknown''size_categories:100K<n<1M''format:parquet'