Datasets
epfml/FineWeb2-HQ
3354 downloads
['task_categories:text-generation''language:ru''language:zh'
zechen-nlp/MNLP_STEM_mcqa_demo
3351 downloads
['size_categories:n<1K''format:parquet''modality:text'
3dlg-hcvc/omages_ABO
3350 downloads
['task_categories:text-to-3d''license:cc-by-4.0''modality:image'
sail/regmix-data
3337 downloads
['language:en''license:mit''size_categories:10M<n<100M'
Hyper-AI-Computer/KeystoneFuse-Train-Data-Pretrain-V3
3332 downloads
['size_categories:1M<n<10M''format:parquet''modality:text'
InstaDeepAI/nucleotide_transformer_downstream_tasks_revised
3331 downloads
['region:us']
Xinran0906/SA-1B
3327 downloads
['region:us']
WitchesSocialStream/Four-Leaf-Clover
3323 downloads
['license:cc-by-4.0''region:us''not-for-all-audiences']
StormKing99/x_dataset_8191
3322 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:question-answering'
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
3318 downloads
['size_categories:100K<n<1M''format:parquet''library:datasets'