eval-leaderboard/4pd-niotest-main.json

33 lines
810 B
JSON
Raw Normal View History

2025-10-16 10:10:07 +00:00
{
"id": "4pd/niotest@main",
"description": "nio test eval rank",
"updatedAt": "2023-11-14 15:56:15",
"owner": "nio",
"results": {
"ceval": 59.92,
"mmlu": 55.46,
"triviaqa": 55.98,
"hellaswag": 71.76,
"cmmlu": 62.03,
"C3": 72.0,
"lambada": 66.83,
"SageBench-exam": 75.04,
"CValues-Responsibility": 90.07,
"longbench_lsht": 90.07,
"longbench_vcsum": 90.07,
"longbench_dureader": 90.07,
"longbench_multifieldqa_zh": 90.07,
"longbench_passage_retrieval_zh": 90.07
},
"metadata": {
"language": [
"zh",
"en"
],
"tags": [
"qwen"
],
"pipeline_tag": "text-generation",
"inference": false
}
}