OpenCompass/configs/summarizers/longbench.py
Fengzhe Zhou b4afe3e7c1
[Sync] Add InternLM2 Keyset Evaluation Demo (#807)
Co-authored-by: zhangyifan1 <zhangyifan1@pjlab.org.cn>
2024-01-17 13:48:12 +08:00

33 lines
1.2 KiB
Python

# Summarizer settings for the LongBench results.
# `dataset_abbrs` holds the dataset abbreviations, grouped by task category;
# each group is introduced by a dashed banner string naming the category.
summarizer = {
    'dataset_abbrs': [
        # Category banner: single-document QA
        '--------- LongBench Single-Document QA ---------',
        'LongBench_narrativeqa',
        'LongBench_qasper',
        'LongBench_multifieldqa_en',
        'LongBench_multifieldqa_zh',
        # Category banner: multi-document QA
        '--------- LongBench Multi-Document QA ---------',
        'LongBench_hotpotqa',
        'LongBench_2wikimqa',
        'LongBench_musique',
        'LongBench_dureader',
        # Category banner: summarization
        '--------- LongBench Summarization ---------',
        'LongBench_gov_report',
        'LongBench_qmsum',
        'LongBench_multi_news',
        'LongBench_vcsum',
        # Category banner: few-shot learning
        '--------- LongBench Few-shot Learning ---------',
        'LongBench_trec',
        'LongBench_triviaqa',
        'LongBench_samsum',
        'LongBench_lsht',
        # Category banner: synthetic tasks
        '--------- LongBench Synthetic Tasks ---------',
        'LongBench_passage_count',
        'LongBench_passage_retrieval_en',
        'LongBench_passage_retrieval_zh',
        # Category banner: code completion
        '--------- LongBench Code Completion ---------',
        'LongBench_lcc',
        'LongBench_repobench-p',
    ],
    # Concatenate every list bound to a name ending in '_summary_groups' in
    # the current scope. `locals()` is evaluated here, in the enclosing scope,
    # before the generator starts; the result is [] when no such name exists.
    'summary_groups': sum(
        (
            groups
            for name, groups in locals().items()
            if name.endswith('_summary_groups')
        ),
        [],
    ),
}