Datasets
chandar-lab/UR100P
1113 downloads
['license:cc-by-4.0''size_categories:100M<n<1B''format:csv'
AudioLLMs/Multitask-National-Speech-Corpus-v1-extend
1113 downloads
['size_categories:10M<n<100M''format:parquet''modality:audio'
rag-datasets/rag-mini-bioasq
1112 downloads
['task_categories:question-answering''task_categories:sentence-similarity''language:en'
StormKing99/x_dataset_47268
1112 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:question-answering'
Mxode/BiST
1111 downloads
['task_categories:translation''language:en''language:zh'
cannlytics/cannabis_licenses
1110 downloads
['annotations_creators:expert-generated''language_creators:expert-generated''license:cc-by-4.0'
asapp/slue-phase-2
1110 downloads
['size_categories:10K<n<100K''format:parquet''modality:audio'
UBC-NLP/Casablanca
1110 downloads
['language:ar''license:cc-by-nc-nd-4.0''size_categories:10K<n<100K'
teknium/GPT4-LLM-Cleaned
1109 downloads
['size_categories:10K<n<100K''format:json''modality:text'
qmeeus/voxpopuli
1109 downloads
['size_categories:100K<n<1M''format:parquet''modality:audio'