# HumanEval dataset configuration: reader, inference and evaluation settings
# bundled into ``humaneval_datasets``.
from opencompass.openicl.icl_prompt_template import PromptTemplate
from opencompass.openicl.icl_retriever import ZeroRetriever
from opencompass.openicl.icl_inferencer import GenInferencer
from opencompass.datasets import HFDataset, HumanEvaluator

# Reader settings: 'prompt' is the only input column, 'task_id' is used as the
# output column, and the 'test' split is named as the train split.
# TODO: allow empty output-column
humaneval_reader_cfg = dict(
    input_columns=['prompt'],
    output_column='task_id',
    train_split='test',
)

# Inference settings: a fixed instruction followed by one HUMAN turn holding
# the dataset's '{prompt}' field, no retrieved examples (ZeroRetriever), and
# generation limited by max_out_len=512.
humaneval_infer_cfg = dict(
    prompt_template=dict(
        type=PromptTemplate,
        template=dict(
            begin=[
                # Declared with role SYSTEM and fallback_role HUMAN.
                dict(
                    role='SYSTEM',
                    fallback_role='HUMAN',
                    prompt='Complete the following python code:',
                ),
            ],
            round=[
                dict(role='HUMAN', prompt='{prompt}'),
            ],
        ),
    ),
    retriever=dict(type=ZeroRetriever),
    inferencer=dict(type=GenInferencer, max_out_len=512),
)

# Evaluation settings: predictions are taken from the BOT role and passed
# through the 'humaneval' postprocessor before HumanEvaluator runs.
humaneval_eval_cfg = dict(
    evaluator=dict(type=HumanEvaluator),
    pred_role='BOT',
    # This parameter applies only to humaneval.
    # NOTE(review): presumably the k values for pass@k -- confirm against
    # HumanEvaluator.
    k=[1, 10, 100],
    pred_postprocessor=dict(type='humaneval'),
)

# Dataset entries exported by this config.
humaneval_datasets = [
    dict(
        type=HFDataset,
        path='openai_humaneval',
        reader_cfg=humaneval_reader_cfg,
        infer_cfg=humaneval_infer_cfg,
        eval_cfg=humaneval_eval_cfg,
    ),
]