# Mirror of https://github.com/open-compass/opencompass.git
# (synced 2025-05-30 16:03:24 +08:00; 64 lines, 1.6 KiB, Python)
from mmengine.config import read_base
|
|
|
|
# Import the per-benchmark summary-group definitions inside mmengine's
# `read_base()` context.
#
# None of these names is referenced explicitly later in the file: the
# `summarizer` definition collects every variable whose name ends with
# `_summary_groups` from the namespace. Each import therefore contributes to
# `summary_groups` even if it looks unused, and the import order determines
# the order in which the groups are concatenated.
with read_base():
    from .groups.agieval import agieval_summary_groups
    from .groups.mmlu import mmlu_summary_groups
    from .groups.cmmlu import cmmlu_summary_groups
    from .groups.ceval import ceval_summary_groups
    from .groups.bbh import bbh_summary_groups
    from .groups.GaokaoBench import GaokaoBench_summary_groups
    from .groups.flores import flores_summary_groups
    from .groups.tydiqa import tydiqa_summary_groups
    from .groups.xiezhi import xiezhi_summary_groups
|
|
|
|
# Summarizer configuration.
#
# `dataset_abbrs` is the ordered list of entries to report. The
# '--- Name ---' strings are interleaved with dataset abbreviations and
# presumably act as section headings in the rendered summary (confirm
# against the summarizer implementation).
#
# `summary_groups` is built by concatenating every list bound to a name
# ending in `_summary_groups` in the current namespace, i.e. the group
# definitions imported at the top of this file.
summarizer = dict(
    dataset_abbrs=[
        '--- Exam ---',
        'mmlu',
        'ceval',
        'bbh',
        '--- ChineseUniversal ---',
        'CMRC_dev',
        'DRCD_dev',
        'afqmc-dev',
        'bustm-dev',
        'chid-dev',
        'cluewsc-dev',
        'eprstmt-dev',
        '--- Coding ---',
        'openai_humaneval',
        'mbpp',
        '--- Completion ---',
        'lambada',
        'story_cloze',
        '--- EnglishUniversal ---',
        'AX_b',
        'AX_g',
        'BoolQ',
        'CB',
        'COPA',
        'MultiRC',
        'RTE',
        'ReCoRD',
        'WiC',
        'WSC',
        'race-high',
        'race-middle',
        '--- Reasoning ---',
        'math',
        'gsm8k',
        'summedits',
        '--- QA ---',
        'hellaswag',
        'piqa',
        'winogrande',
        'openbookqa',
        'openbookqa_fact',
        'nq',
        'triviaqa',
        '--- Security ---',
        'crows_pairs',
    ],
    # `locals()` is evaluated at module level here, so it sees the imported
    # `*_summary_groups` lists; `sum(..., [])` flattens them into one list.
    summary_groups=sum(
        [v for k, v in locals().items() if k.endswith('_summary_groups')],
        [],
    ),
)
|