Datasets
nyu-dice-lab/lm-eval-results-yunconglong-MoE_13B_DPO-private
339 downloads
['size_categories:100K<n<1M''format:json''modality:tabular'
saqlainr/960m06
339 downloads
['size_categories:n<1K''format:json''modality:text'
medalpaca/medical_meadow_wikidoc
338 downloads
['task_categories:question-answering''language:en''license:cc'
stanford-crfm/helm-scenarios
338 downloads
['size_categories:n<1K''format:json''modality:text'
nlpllmeval/NLP-Course-LLM-Reasoning-Eval-May2025
338 downloads
['license:mit''size_categories:n<1K''format:json'
MathGenie/MathCode-Pile
337 downloads
['license:apache-2.0''size_categories:100K<n<1M''format:json'
dan-c212/def_hot4
337 downloads
['size_categories:n<1K''format:json''modality:text'
thomaskim1130/FinanceRAG-Lingua
336 downloads
['language:en''license:mit''size_categories:100K<n<1M'
NovaSky-AI/Sky-T1_data_17k
336 downloads
['license:apache-2.0''size_categories:10K<n<100K''format:json'
Anthropic/model-written-evals
335 downloads
['task_categories:multiple-choice''task_categories:zero-shot-classification''task_categories:question-answering'