OpenCompass/opencompass/configs/summarizers/judgerbenchv2.py
bittersweet1999 37cbaf8d92
[Add] Add Judgerbenchv2 (#2067)
* fix pip version

* fix pip version

* add judgerbenchv2

* Update __init__.py
2025-04-30 17:12:34 +08:00

16 lines
475 B
Python

# Task subset names covered by the Judgerbenchv2 summary group.
tasks = [
    'Code_and_AI',
    'Creation',
    'LanTask',
    'IF',
    'chatQA',
    'Hallucination',
    'safe',
    'Reason_and_analysis',
    'Longtext',
    'Knowledge',
]

# One [subset_name, metric_name] pair per task; every task uses 'final_score'.
Judgerbenchv2_summary_names = [[subset, 'final_score'] for subset in tasks]

# A single summary group named 'Judgerbenchv2' whose subsets are fresh copies
# of the pairs above (the inner lists are not shared with
# Judgerbenchv2_summary_names).
# NOTE(review): how the group's subsets are combined into one score is decided
# by the consuming summarizer, not by this file — confirm there.
Judgerbenchv2_summary_groups = [
    dict(
        name='Judgerbenchv2',
        subsets=[list(pair) for pair in Judgerbenchv2_summary_names],
    ),
]

# Summarizer config: lists only the 'Judgerbenchv2' group under dataset_abbrs
# and passes along the group definition built above.
summarizer = {
    'dataset_abbrs': ['Judgerbenchv2'],
    'summary_groups': Judgerbenchv2_summary_groups,
}