from mmengine.config import read_base from opencompass.openicl.icl_prompt_template import PromptTemplate from opencompass.openicl.icl_retriever import ZeroRetriever from opencompass.openicl.icl_inferencer import GenInferencer from opencompass.openicl.icl_evaluator import AccEvaluator from opencompass.datasets import MMLUDataset from opencompass.utils.text_postprocessors import match_answer_pattern with read_base(): from .mmlu_all_sets import mmlu_all_sets # None of the mmlu dataset in huggingface is correctly parsed, so we use our own dataset reader # Please download the dataset from https://people.eecs.berkeley.edu/~hendrycks/data.tar QUERY_TEMPLATE = """ Answer the following multiple choice question. The last line of your response should be of the following format: 'ANSWER: $LETTER' (without quotes) where LETTER is one of ABCD. Think step by step before answering. {input} A) {A} B) {B} C) {C} D) {D} """.strip() mmlu_reader_cfg = dict( input_columns=["input", "A", "B", "C", "D"], output_column="target", train_split='dev') mmlu_datasets = [] for name in mmlu_all_sets: mmlu_infer_cfg = dict( prompt_template=dict( type=PromptTemplate, template=dict( round=[ dict(role="HUMAN", prompt=QUERY_TEMPLATE), ], ), ), retriever=dict(type=ZeroRetriever), inferencer=dict(type=GenInferencer), ) mmlu_eval_cfg = dict( evaluator=dict(type=AccEvaluator), pred_postprocessor=dict(type=match_answer_pattern, answer_pattern=r"(?i)ANSWER\s*:\s*([A-D])")) mmlu_datasets.append( dict( abbr=f"lukaemon_mmlu_{name}", type=MMLUDataset, path="./data/mmlu/", name=name, reader_cfg=mmlu_reader_cfg, infer_cfg=mmlu_infer_cfg, eval_cfg=mmlu_eval_cfg, ))