mirror of
https://github.com/open-compass/opencompass.git
synced 2025-05-30 16:03:24 +08:00

* add evaluation of scibench * add evaluation of scibench * update scibench * remove scibench evaluator --------- Co-authored-by: Leymore <zfz-960727@163.com>
7 lines
350 B
Python
7 lines
350 B
Python
# Summary groups for the SciBench datasets: one aggregate entry per name
# suffix, each listing the per-task subset names that belong to it.
scibench_summary_groups = []

# Task identifiers used to build the per-task subset names below.
scibench_tasks = ["atkins", "calculus", "chemmc", "class", "diff", "fund", "matter", "quan", "stat", "thermo"]

# The empty suffix yields the plain "scibench" group; every other suffix is
# appended both to the group name and to each of its subset names.
# NOTE(review): the suffixes presumably denote prompting variants
# (zero-shot / few-shot, with or without CoT) -- confirm against the
# dataset configs.
for suffix in ["", "_zs-cot", "_fs", "_fs-cot"]:
    # Subset names follow the pattern "scibench-<task><suffix>".
    subsets = [f"scibench-{subset}{suffix}" for subset in scibench_tasks]
    scibench_summary_groups.append({'name': f'scibench{suffix}', 'subsets': subsets})