# OpenCompass/configs/datasets/xiezhi/xiezhi_ppl_ea6bd7.py
# 2024-05-14 15:35:58 +08:00
#
# 50 lines
# 1.6 KiB
# Python

from opencompass.openicl.icl_prompt_template import PromptTemplate
from opencompass.openicl.icl_inferencer import PPLInferencer
from opencompass.openicl.icl_evaluator import AccEvaluator
from opencompass.datasets import XiezhiDataset, XiezhiRetriever
# Dataset configs for the Xiezhi multiple-choice benchmark: one entry is
# appended to `xiezhi_datasets` for each split listed in the loop below.
xiezhi_datasets = []

for split in ['spec_eng', 'spec_chn', 'inter_eng', 'inter_chn']:
    # Splits whose name contains 'chn' get Chinese question/answer labels in
    # the prompt; every other split gets the English labels.
    if 'chn' in split:
        q_hint, a_hint = '题目', '答案'
    else:
        q_hint, a_hint = 'Question', 'Answer'

    xiezhi_reader_cfg = dict(
        input_columns=['question', 'A', 'B', 'C', 'D', 'labels'],
        output_column='answer',
        train_split='train',
        test_split='test',
    )

    xiezhi_infer_cfg = dict(
        ice_template=dict(
            type=PromptTemplate,
            # One template per candidate letter. The HUMAN turn is the same
            # for all four; only the letter written into the BOT turn differs.
            # `begin` is the same string as `ice_token` below.
            # NOTE(review): presumably that is where the retrieved in-context
            # examples get inserted; confirm against PromptTemplate.
            template={
                answer: dict(
                    begin='</E>',
                    round=[
                        dict(
                            role='HUMAN',
                            # Doubled braces survive the f-string as literal
                            # `{question}`, `{A}`, ... placeholders; only
                            # `q_hint` is substituted here.
                            prompt=(
                                f'{q_hint}: {{question}}\n'
                                f'A. {{A}}\nB. {{B}}\nC. {{C}}\nD. {{D}}'
                            ),
                        ),
                        dict(role='BOT', prompt=f'{a_hint}: {answer}'),
                    ],
                )
                for answer in ['A', 'B', 'C', 'D']
            },
            ice_token='</E>',
        ),
        retriever=dict(type=XiezhiRetriever, ice_num=3),
        inferencer=dict(type=PPLInferencer),
    )

    xiezhi_eval_cfg = dict(evaluator=dict(type=AccEvaluator))

    xiezhi_datasets.append(
        dict(
            type=XiezhiDataset,
            abbr=f'xiezhi-{split}',
            path='./data/xiezhi/',
            name='xiezhi_' + split,
            reader_cfg=xiezhi_reader_cfg,
            infer_cfg=xiezhi_infer_cfg,
            eval_cfg=xiezhi_eval_cfg,
        )
    )