Datasets
NoamDiamant52/TinyStories_tokenized
590 downloads
['size_categories:100K<n<1M''format:parquet''library:datasets'
vietgpt/the_pile_openwebtext2
589 downloads
['language:en''size_categories:10M<n<100M''format:parquet'
nomic-ai/bert-128-grouped
589 downloads
['size_categories:10M<n<100M''format:parquet''library:datasets'
matlok/python-image-copilot-training-using-class-knowledge-graphs
589 downloads
['task_categories:text-to-image''task_categories:image-to-image''task_categories:question-answering'
Q-bert/DOGE-USD-2023-01-01_2024-08-24
589 downloads
['size_categories:n<1K''format:parquet''library:datasets'
SWE-Gym/SWE-Gym-Lite
589 downloads
['size_categories:n<1K''format:parquet''modality:text'
sentence-transformers/msmarco-msmarco-MiniLM-L6-v3
588 downloads
['task_categories:feature-extraction''task_categories:sentence-similarity''multilinguality:monolingual'
neo4j/text2cypher-2025v1
588 downloads
['language:en''license:apache-2.0''size_categories:10K<n<100K'
timaeus/pile-pubmed_abstracts
587 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
data-is-better-together/10k_prompts_ranked
586 downloads
['task_categories:text-classification''task_categories:text-generation''task_categories:reinforcement-learning'