2024-03-04 14:42:36 +08:00
|
|
|
from opencompass.openicl.icl_prompt_template import PromptTemplate
|
|
|
|
from opencompass.openicl.icl_retriever import FixKRetriever
|
|
|
|
from opencompass.openicl.icl_inferencer import PPLInferencer
|
2024-05-21 14:22:46 +08:00
|
|
|
from opencompass.openicl.icl_evaluator import AccwithDetailsEvaluator
|
2024-03-04 14:42:36 +08:00
|
|
|
from opencompass.datasets import CMMLUDataset
|
|
|
|
from opencompass.utils.text_postprocessors import first_capital_postprocess
|
|
|
|
|
|
|
|
cmmlu_subject_mapping = {
|
|
|
|
'agronomy': '农学',
|
|
|
|
'anatomy': '解剖学',
|
|
|
|
'ancient_chinese': '古汉语',
|
|
|
|
'arts': '艺术学',
|
|
|
|
'astronomy': '天文学',
|
|
|
|
'business_ethics': '商业伦理',
|
|
|
|
'chinese_civil_service_exam': '中国公务员考试',
|
|
|
|
'chinese_driving_rule': '中国驾驶规则',
|
|
|
|
'chinese_food_culture': '中国饮食文化',
|
|
|
|
'chinese_foreign_policy': '中国外交政策',
|
|
|
|
'chinese_history': '中国历史',
|
|
|
|
'chinese_literature': '中国文学',
|
|
|
|
'chinese_teacher_qualification': '中国教师资格',
|
|
|
|
'clinical_knowledge': '临床知识',
|
|
|
|
'college_actuarial_science': '大学精算学',
|
|
|
|
'college_education': '大学教育学',
|
|
|
|
'college_engineering_hydrology': '大学工程水文学',
|
|
|
|
'college_law': '大学法律',
|
|
|
|
'college_mathematics': '大学数学',
|
|
|
|
'college_medical_statistics': '大学医学统计',
|
|
|
|
'college_medicine': '大学医学',
|
|
|
|
'computer_science': '计算机科学',
|
|
|
|
'computer_security': '计算机安全',
|
|
|
|
'conceptual_physics': '概念物理学',
|
|
|
|
'construction_project_management': '建设工程管理',
|
|
|
|
'economics': '经济学',
|
|
|
|
'education': '教育学',
|
|
|
|
'electrical_engineering': '电气工程',
|
|
|
|
'elementary_chinese': '小学语文',
|
|
|
|
'elementary_commonsense': '小学常识',
|
|
|
|
'elementary_information_and_technology': '小学信息技术',
|
|
|
|
'elementary_mathematics': '初等数学',
|
|
|
|
'ethnology': '民族学',
|
|
|
|
'food_science': '食品科学',
|
|
|
|
'genetics': '遗传学',
|
|
|
|
'global_facts': '全球事实',
|
|
|
|
'high_school_biology': '高中生物',
|
|
|
|
'high_school_chemistry': '高中化学',
|
|
|
|
'high_school_geography': '高中地理',
|
|
|
|
'high_school_mathematics': '高中数学',
|
|
|
|
'high_school_physics': '高中物理学',
|
|
|
|
'high_school_politics': '高中政治',
|
|
|
|
'human_sexuality': '人类性行为',
|
|
|
|
'international_law': '国际法学',
|
|
|
|
'journalism': '新闻学',
|
|
|
|
'jurisprudence': '法理学',
|
|
|
|
'legal_and_moral_basis': '法律与道德基础',
|
|
|
|
'logical': '逻辑学',
|
|
|
|
'machine_learning': '机器学习',
|
|
|
|
'management': '管理学',
|
|
|
|
'marketing': '市场营销',
|
|
|
|
'marxist_theory': '马克思主义理论',
|
|
|
|
'modern_chinese': '现代汉语',
|
|
|
|
'nutrition': '营养学',
|
|
|
|
'philosophy': '哲学',
|
|
|
|
'professional_accounting': '专业会计',
|
|
|
|
'professional_law': '专业法学',
|
|
|
|
'professional_medicine': '专业医学',
|
|
|
|
'professional_psychology': '专业心理学',
|
|
|
|
'public_relations': '公共关系',
|
|
|
|
'security_study': '安全研究',
|
|
|
|
'sociology': '社会学',
|
|
|
|
'sports_science': '体育学',
|
|
|
|
'traditional_chinese_medicine': '中医中药',
|
|
|
|
'virology': '病毒学',
|
|
|
|
'world_history': '世界历史',
|
|
|
|
'world_religions': '世界宗教'
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
cmmlu_all_sets = list(cmmlu_subject_mapping.keys())
|
|
|
|
|
|
|
|
cmmlu_datasets = []
|
|
|
|
for _name in cmmlu_all_sets:
|
|
|
|
_ch_name = cmmlu_subject_mapping[_name]
|
2024-05-14 15:35:58 +08:00
|
|
|
hint = f'以下是关于{_ch_name}的单项选择题,请直接给出正确答案的选项。'
|
|
|
|
question_and_options = '题目:{question}\nA. {A}\nB. {B}\nC. {C}\nD. {D}'
|
2024-03-04 14:42:36 +08:00
|
|
|
cmmlu_infer_cfg = dict(
|
|
|
|
ice_template=dict(
|
|
|
|
type=PromptTemplate,
|
2024-05-14 15:35:58 +08:00
|
|
|
template={answer: f'{question_and_options}\n答案是: {answer}\n' for answer in ['A', 'B', 'C', 'D']},
|
2024-03-04 14:42:36 +08:00
|
|
|
),
|
|
|
|
prompt_template=dict(
|
|
|
|
type=PromptTemplate,
|
2024-05-14 15:35:58 +08:00
|
|
|
template={answer: f'{hint}\n</E>{question_and_options}\n答案是: {answer}' for answer in ['A', 'B', 'C', 'D']},
|
|
|
|
ice_token='</E>',
|
2024-03-04 14:42:36 +08:00
|
|
|
),
|
|
|
|
retriever=dict(type=FixKRetriever, fix_id_list=[0, 1, 2, 3, 4]),
|
|
|
|
inferencer=dict(type=PPLInferencer),
|
|
|
|
)
|
|
|
|
|
2024-05-21 14:22:46 +08:00
|
|
|
cmmlu_eval_cfg = dict(evaluator=dict(type=AccwithDetailsEvaluator))
|
2024-03-04 14:42:36 +08:00
|
|
|
|
|
|
|
cmmlu_datasets.append(
|
|
|
|
dict(
|
|
|
|
type=CMMLUDataset,
|
2024-05-14 15:35:58 +08:00
|
|
|
path='./data/cmmlu/',
|
2024-03-04 14:42:36 +08:00
|
|
|
name=_name,
|
2024-05-14 15:35:58 +08:00
|
|
|
abbr=f'cmmlu-{_name}',
|
2024-03-04 14:42:36 +08:00
|
|
|
reader_cfg=dict(
|
2024-05-14 15:35:58 +08:00
|
|
|
input_columns=['question', 'A', 'B', 'C', 'D'],
|
|
|
|
output_column='answer',
|
|
|
|
train_split='dev',
|
2024-03-04 14:42:36 +08:00
|
|
|
test_split='test'),
|
|
|
|
infer_cfg=cmmlu_infer_cfg,
|
|
|
|
eval_cfg=cmmlu_eval_cfg,
|
|
|
|
))
|
|
|
|
|
|
|
|
del _name, _ch_name
|