| .. |
|
adv_glue
|
init
|
2025-07-18 07:25:44 +00:00 |
|
agieval
|
init
|
2025-07-18 07:25:44 +00:00 |
|
anli
|
init
|
2025-07-18 07:25:44 +00:00 |
|
apps
|
init
|
2025-07-18 07:25:44 +00:00 |
|
ARC_c
|
init
|
2025-07-18 07:25:44 +00:00 |
|
ARC_e
|
init
|
2025-07-18 07:25:44 +00:00 |
|
bbh
|
init
|
2025-07-18 07:25:44 +00:00 |
|
ceval
|
init
|
2025-07-18 07:25:44 +00:00 |
|
civilcomments
|
init
|
2025-07-18 07:25:44 +00:00 |
|
CLUE_afqmc
|
init
|
2025-07-18 07:25:44 +00:00 |
|
CLUE_C3
|
init
|
2025-07-18 07:25:44 +00:00 |
|
CLUE_cmnli
|
init
|
2025-07-18 07:25:44 +00:00 |
|
CLUE_CMRC
|
init
|
2025-07-18 07:25:44 +00:00 |
|
CLUE_DRCD
|
init
|
2025-07-18 07:25:44 +00:00 |
|
CLUE_ocnli
|
init
|
2025-07-18 07:25:44 +00:00 |
|
cmb
|
init
|
2025-07-18 07:25:44 +00:00 |
|
cmmlu
|
init
|
2025-07-18 07:25:44 +00:00 |
|
collections
|
init
|
2025-07-18 07:25:44 +00:00 |
|
commonsenseqa
|
init
|
2025-07-18 07:25:44 +00:00 |
|
crowspairs
|
init
|
2025-07-18 07:25:44 +00:00 |
|
cvalues
|
init
|
2025-07-18 07:25:44 +00:00 |
|
drop
|
init
|
2025-07-18 07:25:44 +00:00 |
|
ds1000
|
init
|
2025-07-18 07:25:44 +00:00 |
|
FewCLUE_bustm
|
init
|
2025-07-18 07:25:44 +00:00 |
|
FewCLUE_chid
|
init
|
2025-07-18 07:25:44 +00:00 |
|
FewCLUE_cluewsc
|
init
|
2025-07-18 07:25:44 +00:00 |
|
FewCLUE_csl
|
init
|
2025-07-18 07:25:44 +00:00 |
|
FewCLUE_eprstmt
|
init
|
2025-07-18 07:25:44 +00:00 |
|
FewCLUE_ocnli_fc
|
init
|
2025-07-18 07:25:44 +00:00 |
|
FewCLUE_tnews
|
init
|
2025-07-18 07:25:44 +00:00 |
|
flores
|
init
|
2025-07-18 07:25:44 +00:00 |
|
game24
|
init
|
2025-07-18 07:25:44 +00:00 |
|
GaokaoBench
|
init
|
2025-07-18 07:25:44 +00:00 |
|
govrepcrs
|
init
|
2025-07-18 07:25:44 +00:00 |
|
gsm8k
|
init
|
2025-07-18 07:25:44 +00:00 |
|
hellaswag
|
init
|
2025-07-18 07:25:44 +00:00 |
|
humaneval
|
init
|
2025-07-18 07:25:44 +00:00 |
|
humanevalx
|
init
|
2025-07-18 07:25:44 +00:00 |
|
iwslt2017
|
init
|
2025-07-18 07:25:44 +00:00 |
|
jigsawmultilingual
|
init
|
2025-07-18 07:25:44 +00:00 |
|
lambada
|
init
|
2025-07-18 07:25:44 +00:00 |
|
lcsts
|
init
|
2025-07-18 07:25:44 +00:00 |
|
leval
|
init
|
2025-07-18 07:25:44 +00:00 |
|
longbench
|
init
|
2025-07-18 07:25:44 +00:00 |
|
math
|
init
|
2025-07-18 07:25:44 +00:00 |
|
mbpp
|
init
|
2025-07-18 07:25:44 +00:00 |
|
mmlu
|
init
|
2025-07-18 07:25:44 +00:00 |
|
narrativeqa
|
init
|
2025-07-18 07:25:44 +00:00 |
|
nq
|
init
|
2025-07-18 07:25:44 +00:00 |
|
obqa
|
init
|
2025-07-18 07:25:44 +00:00 |
|
piqa
|
init
|
2025-07-18 07:25:44 +00:00 |
|
PJExam
|
init
|
2025-07-18 07:25:44 +00:00 |
|
promptbench
|
init
|
2025-07-18 07:25:44 +00:00 |
|
qabench
|
init
|
2025-07-18 07:25:44 +00:00 |
|
qasper
|
init
|
2025-07-18 07:25:44 +00:00 |
|
qaspercut
|
init
|
2025-07-18 07:25:44 +00:00 |
|
race
|
init
|
2025-07-18 07:25:44 +00:00 |
|
realtoxicprompts
|
init
|
2025-07-18 07:25:44 +00:00 |
|
safety
|
init
|
2025-07-18 07:25:44 +00:00 |
|
siqa
|
init
|
2025-07-18 07:25:44 +00:00 |
|
squad20
|
init
|
2025-07-18 07:25:44 +00:00 |
|
storycloze
|
init
|
2025-07-18 07:25:44 +00:00 |
|
strategyqa
|
init
|
2025-07-18 07:25:44 +00:00 |
|
summedits
|
init
|
2025-07-18 07:25:44 +00:00 |
|
summscreen
|
init
|
2025-07-18 07:25:44 +00:00 |
|
SuperGLUE_AX_b
|
init
|
2025-07-18 07:25:44 +00:00 |
|
SuperGLUE_AX_g
|
init
|
2025-07-18 07:25:44 +00:00 |
|
SuperGLUE_BoolQ
|
init
|
2025-07-18 07:25:44 +00:00 |
|
SuperGLUE_CB
|
init
|
2025-07-18 07:25:44 +00:00 |
|
SuperGLUE_COPA
|
init
|
2025-07-18 07:25:44 +00:00 |
|
SuperGLUE_MultiRC
|
init
|
2025-07-18 07:25:44 +00:00 |
|
SuperGLUE_ReCoRD
|
init
|
2025-07-18 07:25:44 +00:00 |
|
SuperGLUE_RTE
|
init
|
2025-07-18 07:25:44 +00:00 |
|
SuperGLUE_WiC
|
init
|
2025-07-18 07:25:44 +00:00 |
|
SuperGLUE_WSC
|
init
|
2025-07-18 07:25:44 +00:00 |
|
TheoremQA
|
init
|
2025-07-18 07:25:44 +00:00 |
|
triviaqa
|
init
|
2025-07-18 07:25:44 +00:00 |
|
triviaqarc
|
init
|
2025-07-18 07:25:44 +00:00 |
|
truthfulqa
|
init
|
2025-07-18 07:25:44 +00:00 |
|
tydiqa
|
init
|
2025-07-18 07:25:44 +00:00 |
|
winograd
|
init
|
2025-07-18 07:25:44 +00:00 |
|
winogrande
|
init
|
2025-07-18 07:25:44 +00:00 |
|
XCOPA
|
init
|
2025-07-18 07:25:44 +00:00 |
|
xiezhi
|
init
|
2025-07-18 07:25:44 +00:00 |
|
XLSum
|
init
|
2025-07-18 07:25:44 +00:00 |
|
Xsum
|
init
|
2025-07-18 07:25:44 +00:00 |
|
z_bench
|
init
|
2025-07-18 07:25:44 +00:00 |