Datasets
m-a-p/FineFineWeb
1286042 downloads
['task_categories:text-classification''task_categories:text2text-generation''task_categories:text-generation'
lavita/medical-qa-shared-task-v1-toy
879546 downloads
['size_categories:n<1K''format:parquet''modality:tabular'
Salesforce/wikitext
733000 downloads
['task_categories:text-generation''task_categories:fill-mask''task_ids:language-modeling'
openai/gsm8k
545923 downloads
['task_categories:text2text-generation''annotations_creators:crowdsourced''language_creators:crowdsourced'
HuggingFaceFW/fineweb
399281 downloads
['task_categories:text-generation''language:en''license:odc-by'
permutans/fineweb-bbc-news
361861 downloads
['language:en''license:odc-by''size_categories:10M<n<100M'
TAUR-Lab/Taur_CoT_Analysis_Project___gpt-4o-2024-08-06
332415 downloads
['size_categories:10K<n<100K''format:parquet''modality:text'
allenai/c4
282943 downloads
['task_categories:text-generation''task_categories:fill-mask''task_ids:language-modeling'
bigcode/commitpackft
271636 downloads
['language:code''license:mit''size_categories:100K<n<1M'
nyu-mll/glue
250100 downloads
['task_categories:text-classification''task_ids:acceptability-classification''task_ids:natural-language-inference'