mirror of
https://github.com/open-compass/opencompass.git
synced 2025-05-30 16:03:24 +08:00
16 lines
475 B
Python
16 lines
475 B
Python
![]() |
|
||
|
# Names that become the subsets of the 'Judgerbenchv2' summary group below.
# NOTE(review): presumably these match the dataset abbreviations produced by
# the Judgerbenchv2 dataset configs -- confirm against those configs.
tasks = [
    'Code_and_AI',
    'Creation',
    'LanTask',
    'IF',
    'chatQA',
    'Hallucination',
    'safe',
    'Reason_and_analysis',
    'Longtext',
    'Knowledge',
]

# One [name, metric] pair per task; every task uses the 'final_score' metric.
Judgerbenchv2_summary_names = [[task, 'final_score'] for task in tasks]

# A single summary group named 'Judgerbenchv2' whose subsets are fresh
# [name, metric] lists, so editing the group's subsets does not mutate
# Judgerbenchv2_summary_names.
Judgerbenchv2_summary_groups = [
    {
        'name': 'Judgerbenchv2',
        'subsets': [
            [name, metric] for name, metric in Judgerbenchv2_summary_names
        ],
    },
]

# Summarizer settings: only the 'Judgerbenchv2' entry is listed in
# dataset_abbrs, and the group definition above is passed as summary_groups.
summarizer = dict(
    dataset_abbrs=[
        'Judgerbenchv2',
    ],
    summary_groups=Judgerbenchv2_summary_groups,
)
|