eval-leaderboard/test-yu.json
2025-10-16 18:10:07 +08:00

16 lines
317 B
JSON

{
"id": "test-yu",
"description": "ChatGPT 3.5",
"owner": "",
"results": {
"ceval": 52.5,
"agieval": 39.9,
"mmlu": 69.1,
"GaokaoBench": 51.1,
"triviaqa": 63.8,
"hellaswag": 79.5,
"cmmlu": 53.9,
"C3": 85.6,
"lambada": 57.5
}
}