From 214a34f0b87aabb4164e958ceded4435ca2e830f Mon Sep 17 00:00:00 2001 From: liushz Date: Mon, 6 Nov 2023 21:58:31 +0800 Subject: [PATCH] =?UTF-8?q?=E3=80=90Feature=E3=80=91Update=20Mathbench=20d?= =?UTF-8?q?ataset=20prompt=20and=20fix=20small=20errors=20(#546)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit * Update mathbench * Update mathbench * Update mathbench --- configs/datasets/MathBench/mathbench_gen.py | 2 +- ...thbench_gen_86de1c.py => mathbench_gen_51000f.py} | 12 ++++++------ 2 files changed, 7 insertions(+), 7 deletions(-) rename configs/datasets/MathBench/{mathbench_gen_86de1c.py => mathbench_gen_51000f.py} (95%) diff --git a/configs/datasets/MathBench/mathbench_gen.py b/configs/datasets/MathBench/mathbench_gen.py index 81a068f2..208d2359 100644 --- a/configs/datasets/MathBench/mathbench_gen.py +++ b/configs/datasets/MathBench/mathbench_gen.py @@ -1,4 +1,4 @@ from mmengine.config import read_base with read_base(): - from .mathbench_gen_86de1c import mathbench_datasets # noqa: F401, F403 + from .mathbench_gen_51000f import mathbench_datasets # noqa: F401, F403 diff --git a/configs/datasets/MathBench/mathbench_gen_86de1c.py b/configs/datasets/MathBench/mathbench_gen_51000f.py similarity index 95% rename from configs/datasets/MathBench/mathbench_gen_86de1c.py rename to configs/datasets/MathBench/mathbench_gen_51000f.py index 1c350e9d..b456a9ef 100644 --- a/configs/datasets/MathBench/mathbench_gen_86de1c.py +++ b/configs/datasets/MathBench/mathbench_gen_51000f.py @@ -8,12 +8,12 @@ from opencompass.utils.text_postprocessors import first_capital_postprocess single_choice_prompts = { "single_choice_cn_with_reasoning": "以下是一道关于数学的单项选择题,请你一步一步推理并得到最终的答案选项。回答格式为如下:\n答案选项:A、B、C、D中你认为正确的一个选项\n计算过程:根据题目得到选项答案的一步步过程\n请严格按照上面的格式回答问题,下面是你要回答的题目:\n{question}\n答案选项:", - "single_choice_cn": "以下是一道关于数学的单项选择题,请你直接给出正确的答案选项。回答格式为如下:\n答案选项:A、B、C、D中你认为正确的选项\n下面是你要回答的题目:\n{question}\n答案选项:", + "single_choice_cn": "以下是一道关于数学的单项选择题,请你给出正确的答案选项。\n下面是你要回答的题目:\n{question}\n答案选项:", "single_choice_en_with_reasoning": "Here is a multiple-choice question about mathematics. Please provide the final answer option by step-by-step reasoning. Please answer in the following format:\nAnswer option: A, B, C, or D (the option you believe is correct)\nCalculation process: Step-by-step process to derive the answer option based on the question\nPlease strictly follow the above format to answer the question. Here is the question you need to answer:\n{question}\nAnswer option:", - "single_choice_en": "Here is a multiple-choice question about mathematics. Please provide the correct answer option directly. Please answer in the following format:\nAnswer option: A, B, C, or D (the option you believe is correct)\nHere is the question you need to answer:\n{question}\nAnswer option:", + "single_choice_en": "Here is a multiple-choice question about mathematics. Please provide the correct answer option directly.\nHere is the question you need to answer:\n{question}\nAnswer option:", } -cloze_prompts ={ +cloze_prompts={ "cloze_cn": [ dict(role='HUMAN', prompt='Q: 林中有15棵树。林务工人员今天将在林中种植树木。完成后,将有21棵树。林务工人员今天种植了多少棵树?'), dict(role='BOT', prompt='A: 我们从15棵树开始。后来有21棵树。差值必定是他们种植的树木数量。所以,他们必须种植了21 - 15 = 6棵树。答案是 6\n'), @@ -61,16 +61,15 @@ mathbench_sets = { 'college': ['single_choice_cn', 'cloze_en'], 'high': ['single_choice_cn', 'single_choice_en'], 'middle': ['single_choice_cn'], - 'primary': ['single_choice_cn', 'cloze_cn'], + 'primary': ['cloze_cn'], } # Generate reasoning path if set True or just generate the final answer -with_reasoning = True +with_reasoning = False # Use circular evaluation or not with_circular_eval = True - mathbench_datasets = [] for _split in list(mathbench_sets.keys()): @@ -102,6 +101,7 @@ for _split in list(mathbench_sets.keys()): type=MathBenchDataset, path=f"./data/mathbench/{_split}", name=_name, + with_circular=with_circular_eval, abbr="mathbench-" + _split + '-' + _name, reader_cfg=dict( input_columns=["question"],