Datasets
lavita/medical-qa-shared-task-v1-toy
879546 downloads
['size_categories:n<1K''format:parquet''modality:tabular'
Salesforce/wikitext
733000 downloads
['task_categories:text-generation''task_categories:fill-mask''task_ids:language-modeling'
jat-project/jat-dataset-tokenized
674446 downloads
['size_categories:10M<n<100M''format:parquet''modality:timeseries'
openai/gsm8k
545923 downloads
['task_categories:text2text-generation''annotations_creators:crowdsourced''language_creators:crowdsourced'
HuggingFaceFW/fineweb
399281 downloads
['task_categories:text-generation''language:en''license:odc-by'
permutans/fineweb-bbc-news
361861 downloads
['language:en''license:odc-by''size_categories:10M<n<100M'
TAUR-Lab/Taur_CoT_Analysis_Project___gpt-4o-2024-08-06
332415 downloads
['size_categories:10K<n<100K''format:parquet''modality:text'
nyu-mll/glue
250100 downloads
['task_categories:text-classification''task_ids:acceptability-classification''task_ids:natural-language-inference'
princeton-nlp/SWE-bench_Verified
248308 downloads
['size_categories:n<1K''format:parquet''modality:text'
allenai/ai2_arc
220975 downloads
['task_categories:question-answering''task_ids:open-domain-qa''task_ids:multiple-choice-qa'