Datasets
lyk/PaperDigestDataBase
1901 downloads
['license:mit''size_categories:n<1K''format:parquet'
TempestTeam/dataset-the-stack-v2-dedup-sub
1900 downloads
['task_categories:text-generation''license:other''size_categories:10M<n<100M'
openai/mrcr
1896 downloads
['license:mit''size_categories:1K<n<10K''format:parquet'
lerobot/aloha_sim_insertion_human
1887 downloads
['task_categories:robotics''license:mit''size_categories:10K<n<100K'
argilla/distilabel-capybara-dpo-7k-binarized
1884 downloads
['task_categories:question-answering''task_categories:text-generation''language:en'
wecover/OPUS_Europarl
1883 downloads
['size_categories:10M<n<100M''format:parquet''modality:text'
aklein4/chat-compilation-benchmark-5x-Llama-3.2-Instruct-Shuffled
1883 downloads
['size_categories:1M<n<10M''format:parquet''modality:text'
matlok/python-text-copilot-training-instruct-ai-research-2024-02-11
1880 downloads
['task_categories:text-generation''task_categories:question-answering''task_ids:parsing'
gayanin/babylon-native-v8-noise-op-wise
1878 downloads
['size_categories:10K<n<100K''format:parquet''modality:text'
HuggingFaceH4/helpful-instructions
1877 downloads
['license:apache-2.0''size_categories:100K<n<1M''format:parquet'