OpenCompass/configs/summarizers/internlm2_keyset.py
Fengzhe Zhou b4afe3e7c1
[Sync] Add InternLM2 Keyset Evaluation Demo (#807)
Co-authored-by: zhangyifan1 <zhangyifan1@pjlab.org.cn>
2024-01-17 13:48:12 +08:00

21 lines
616 B
Python

from mmengine.config import read_base
# The imports must be nested inside the ``read_base()`` context; left at
# column 0, the ``with`` statement has no body and the file does not parse.
# Each import brings in a ``*_summary_groups`` name that the summarizer
# below collects by its suffix.
with read_base():
    from .groups.agieval import agieval_summary_groups
    from .groups.mmlu import mmlu_summary_groups
    from .groups.bbh import bbh_summary_groups
# Summarizer settings for the InternLM2 keyset evaluation.
summarizer = dict(
    # Rows to report, in order. Each entry is a two-item list; presumably
    # [dataset or group abbreviation, metric name] -- confirm against the
    # OpenCompass summarizer documentation.
    dataset_abbrs=[
        ['mmlu', 'naive_average'],
        ['agieval', 'naive_average'],
        ['bbh', 'naive_average'],
        ['gsm8k', 'accuracy'],
        ['math', 'accuracy'],
        ['openai_humaneval', 'humaneval_pass@1'],
        ['sanitized_mbpp', 'score'],
    ],
    # Concatenate every list in this namespace whose name ends with
    # "_summary_groups". The items are snapshotted with list() first:
    # iterating the live namespace directly from a comprehension can raise
    # "dictionary changed size during iteration" on Python 3.12+ when the
    # module is executed under tracing (e.g. coverage measurement).
    summary_groups=sum(
        [
            groups
            for name, groups in list(locals().items())
            if name.endswith("_summary_groups")
        ],
        [],
    ),
)