mirror of
https://github.com/open-compass/opencompass.git
synced 2025-05-30 16:03:24 +08:00
[Feature] Add new dataset mastermath2024v1 (#744)
* add new dataset mastermath2024v1 * change it to simplified chinese prompt * change file name
This commit is contained in:
parent
17b8e929dd
commit
ef3ae63539
@ -0,0 +1,4 @@
|
|||||||
|
from mmengine.config import read_base

# Aggregate entry point: re-export the concrete generation config for the
# mastermath2024v1 dataset so downstream configs can import it from here.
with read_base():
    from .mastermath2024v1_gen_be6318 import mastermath2024v1_datasets
|
@ -0,0 +1,37 @@
|
|||||||
|
from opencompass.openicl.icl_prompt_template import PromptTemplate
|
||||||
|
from opencompass.openicl.icl_retriever import ZeroRetriever
|
||||||
|
from opencompass.openicl.icl_inferencer import GenInferencer
|
||||||
|
from opencompass.datasets import MastermathDatasetv1, MastermathDatasetv1Evaluator
|
||||||
|
from opencompass.utils import first_option_postprocess
|
||||||
|
|
||||||
|
# Column layout of the source CSV: the question text plus four candidate
# answers as inputs, and the gold option letter as the target column.
mastermath2024v1_reader_cfg = dict(
    input_columns=['question', 'A', 'B', 'C', 'D'],
    output_column='answer',
)
|
||||||
|
|
||||||
|
# Zero-shot generation setup: present the question with its four options and
# ask the model to answer in a fixed Chinese template so the option letter
# can be extracted afterwards.
mastermath2024v1_infer_cfg = dict(
    prompt_template=dict(
        type=PromptTemplate,
        template=dict(round=[
            dict(
                role='HUMAN',
                prompt=('{question}\n选项:\n'
                        '(A){A}\n'
                        '(B){B}\n'
                        '(C){C}\n'
                        '(D){D}\n'
                        '你的回答格式如下: "正确答案是 (在这里插入你的答案)"'),
            ),
        ]),
    ),
    retriever=dict(type=ZeroRetriever),
    inferencer=dict(type=GenInferencer),
)
|
||||||
|
|
||||||
|
# Scoring: model output is first reduced to a single option letter
# (A/B/C/D) by the postprocessor, then compared by the dataset evaluator.
mastermath2024v1_eval_cfg = dict(
    evaluator=dict(type=MastermathDatasetv1Evaluator),
    pred_postprocessor=dict(type=first_option_postprocess, options='ABCD'),
)
|
||||||
|
|
||||||
|
# Final dataset registration consumed by OpenCompass run configs.
mastermath2024v1_datasets = [
    dict(
        abbr='Mastermath2024v1',
        type=MastermathDatasetv1,
        # Data location is relative to the working directory at run time.
        path='./data/mastermath2024v1/',
        name='kaoyan_math_1_mcq_Sheet1.csv',
        reader_cfg=mastermath2024v1_reader_cfg,
        infer_cfg=mastermath2024v1_infer_cfg,
        eval_cfg=mastermath2024v1_eval_cfg,
    ),
]
|
||||||
|
|
@ -54,6 +54,7 @@ from .lawbench import * # noqa: F401, F403
|
|||||||
from .lcsts import * # noqa: F401, F403
|
from .lcsts import * # noqa: F401, F403
|
||||||
from .leval import * # noqa: F401, F403
|
from .leval import * # noqa: F401, F403
|
||||||
from .longbench import * # noqa: F401, F403
|
from .longbench import * # noqa: F401, F403
|
||||||
|
from .mastermath2024v1 import * # noqa: F401, F403
|
||||||
from .math import * # noqa: F401, F403
|
from .math import * # noqa: F401, F403
|
||||||
from .mathbench import * # noqa: F401, F403
|
from .mathbench import * # noqa: F401, F403
|
||||||
from .mbpp import * # noqa: F401, F403
|
from .mbpp import * # noqa: F401, F403
|
||||||
|
63
opencompass/datasets/mastermath2024v1.py
Normal file
63
opencompass/datasets/mastermath2024v1.py
Normal file
@ -0,0 +1,63 @@
|
|||||||
|
import csv
|
||||||
|
import os
|
||||||
|
|
||||||
|
from datasets import Dataset
|
||||||
|
|
||||||
|
from opencompass.openicl import BaseEvaluator
|
||||||
|
from opencompass.registry import LOAD_DATASET
|
||||||
|
|
||||||
|
from .base import BaseDataset
|
||||||
|
|
||||||
|
|
||||||
|
@LOAD_DATASET.register_module()
class MastermathDatasetv1(BaseDataset):
    """Multiple-choice math dataset (mastermath2024v1) loaded from a CSV file.

    Each CSV row is expected to carry the question in column 1, the four
    options in columns 2-5, and the gold answer letter in column 6
    (column 0 is ignored — presumably a row id; TODO confirm against the
    source file).
    """

    @staticmethod
    def load(path: str, name: str):
        """Read ``path/name`` as CSV and return a ``datasets.Dataset``.

        Args:
            path: Directory containing the CSV file.
            name: File name of the CSV inside ``path``.

        Returns:
            A ``Dataset`` with columns question/A/B/C/D/answer.
        """
        data = []
        with open(os.path.join(path, name), 'r', encoding='utf-8') as f:
            reader = csv.reader(f, delimiter=',')
            for row in reader:
                # Skip the header row, identified by its 'question' label.
                if row[1] == 'question':
                    continue
                # Fixed column positions: see class docstring.
                data.append({
                    'question': row[1],
                    'A': row[2],
                    'B': row[3],
                    'C': row[4],
                    'D': row[5],
                    'answer': row[6],
                })

        return Dataset.from_list(data)
|
||||||
|
|
||||||
|
|
||||||
|
class MastermathDatasetv1Evaluator(BaseEvaluator):
    """Exact-match accuracy evaluator for mastermath2024v1 predictions."""

    def score(self, predictions, references):
        """Compare predictions with references by string equality.

        Args:
            predictions: Post-processed model answers (option letters).
            references: Gold answer letters, same length as ``predictions``.

        Returns:
            dict with ``accuracy`` (percentage) and per-item ``details``,
            or an ``error`` entry when the input lengths differ.
        """
        if len(predictions) != len(references):
            return {
                'error': 'predictions and references have different length'
            }
        total = len(predictions)
        # Guard against ZeroDivisionError on empty inputs (original code
        # divided by a running count that would be 0 here).
        if total == 0:
            return {'accuracy': 0.0, 'details': []}

        correct = 0
        details = []
        for pred, ref in zip(predictions, references):
            is_correct = pred == ref
            correct += is_correct
            details.append({
                'pred': pred,
                'answer': ref,
                'correct': is_correct,
            })

        return {'accuracy': 100 * correct / total, 'details': details}
|
Loading…
Reference in New Issue
Block a user