eval-leaderboard/test-yu.json
2025-10-27 08:23:01 +00:00

16 lines
317 B (Stored with Git LFS)
JSON

{
"id": "test-yu",
"description": "ChatGPT 3.5",
"owner": "",
"results": {
"ceval": 52.5,
"agieval": 39.9,
"mmlu": 69.1,
"GaokaoBench": 51.1,
"triviaqa": 63.8,
"hellaswag": 79.5,
"cmmlu": 53.9,
"C3": 85.6,
"lambada": 57.5
}
}