# MedQA generation-style evaluation config.
#
# Builds ``MedQA_datasets``: one dataset entry per regional subset listed in
# ``MedQA_subsets``. Every entry uses the same zero-shot prompt and is scored
# with ``AccEvaluator`` after ``first_option_postprocess`` has been applied to
# the model output.
from opencompass.openicl.icl_prompt_template import PromptTemplate
from opencompass.openicl.icl_retriever import ZeroRetriever
from opencompass.openicl.icl_inferencer import GenInferencer
from opencompass.openicl.icl_evaluator import AccEvaluator
from opencompass.utils.text_postprocessors import first_option_postprocess
from opencompass.datasets.MedQA import MedQADataset

# Prompt sent as the single HUMAN turn. The literal is kept exactly as-is
# (including its escape sequences) so the rendered prompt does not change;
# ``.strip()`` removes the leading/trailing whitespace of the literal.
QUERY_TEMPLATE = """ Answer the following multiple choice question. The last line of your response should be of the following format: 'ANSWER: $LETTER' (without quotes) where LETTER is one of Options(e.g. one of ABCDEFGHIJKLMNOP). Think step by step before answering. Question:\n {question} Options:\n {choices} """.strip()  # noqa: E501

# Filled in by the loop at the bottom of this file.
MedQA_datasets = []

# The input column names match the ``{question}`` / ``{choices}`` placeholders
# used in QUERY_TEMPLATE; ``label`` is the reference-answer column.
MedQA_reader_cfg = dict(
    input_columns=['question', 'choices'],
    output_column='label',
)

# Zero-shot setup: no retrieved examples, one HUMAN round, free-form
# generation.
MedQA_infer_cfg = dict(
    prompt_template=dict(
        type=PromptTemplate,
        template=dict(
            round=[
                dict(role='HUMAN', prompt=QUERY_TEMPLATE),
            ],
        ),
    ),
    retriever=dict(type=ZeroRetriever),
    inferencer=dict(type=GenInferencer),
)

# Subset name -> dataset path passed to MedQADataset.
MedQA_subsets = {
    'US': 'xuxuxuxuxu/MedQA_US_test',
    'Mainland': 'xuxuxuxuxu/MedQA_Mainland_test',
    'Taiwan': 'xuxuxuxuxu/MedQA_Taiwan_test',
}

# One dataset entry per subset. The reader and inference configs are shared
# between entries; a fresh eval config dict is created for each one.
for split in MedQA_subsets:
    # NOTE(review): the prompt advertises answer letters up to 'P', but only
    # 'ABCD' is extracted here -- confirm that no subset has more than four
    # options per question.
    MedQA_eval_cfg = dict(
        evaluator=dict(type=AccEvaluator),
        pred_postprocessor=dict(
            type=first_option_postprocess,
            options='ABCD',
        ),
    )

    MedQA_datasets.append(
        dict(
            abbr=f'MedQA_{split}',
            type=MedQADataset,
            path=MedQA_subsets[split],
            reader_cfg=MedQA_reader_cfg,
            infer_cfg=MedQA_infer_cfg,
            eval_cfg=MedQA_eval_cfg,
        )
    )