{
    "公开核心榜单": [
        "ceval",
        "mmlu",
        "triviaqa",
        "hellaswag",
        "cmmlu",
        "C3",
        "lambada"
    ],
    "私有榜单V1": [
        "SageBench-exam"
    ],
    "私有榜单V2": [],
    "中文": [
        "ceval",
        "cmmlu",
        "C3",
        "SageBench-exam"
    ],
    "英文": [
        "mmlu",
        "triviaqa",
        "hellaswag",
        "lambada"
    ],
    "长窗口": [
        "longbench_lsht",
        "longbench_vcsum",
        "longbench_dureader",
        "longbench_multifieldqa_zh",
        "longbench_passage_retrieval_zh"
    ]
}