# Mirror of https://github.com/open-compass/opencompass.git
# (synced 2025-05-30 16:03:24 +08:00; 26 lines, 885 B, Python)
from mmengine.config import read_base

# Base-config import, written inside `read_base()` per the mmengine config
# convention. The imported name ends in `_summary_groups`, so the
# `locals()` scan in `summarizer` below picks it up.
with read_base():
    from .groups.mathbench_agent import mathbench_agent_summary_groups


# Summarizer configuration for the GSM8K / MATH / MathBench agent results.
summarizer = dict(
    # Entries are either plain strings or [dataset abbreviation, metric]
    # pairs. Strings tagged `# category` act as section headings; the
    # untagged strings at the end presumably name summary groups supplied
    # by the imported `*_summary_groups` lists (confirm against the
    # group definitions).
    dataset_abbrs=[
        '######## GSM8K-Agent Accuracy ########',  # category
        ['gsm8k-agent', 'follow_acc'],
        ['gsm8k-agent', 'reasoning_acc'],
        ['gsm8k-agent', 'code_acc'],
        ['gsm8k-agent', 'action_pct'],
        '######## MATH-Agent Accuracy ########',  # category
        ['math-agent', 'follow_acc'],
        ['math-agent', 'reasoning_acc'],
        ['math-agent', 'code_acc'],
        ['math-agent', 'action_pct'],
        '######## MathBench-Agent Accuracy ########',  # category
        'mathbench-agent',
        'mathbench-circular-agent',
        'mathbench-circular-and-cloze-agent',
    ],
    # Collect every value in the current namespace whose name ends with
    # `_summary_groups` and concatenate them into one flat list
    # (`sum(list_of_lists, [])` joins the lists in namespace order).
    summary_groups=sum(
        [v for k, v in locals().items() if k.endswith('_summary_groups')], []),
)