# Dataset configuration for the `openai_humaneval` dataset.
#
# Defines the reader, inference and evaluation settings and bundles them into
# `humaneval_datasets`, the list of dataset entries declared by this module.
from opencompass.openicl.icl_prompt_template import PromptTemplate
from opencompass.openicl.icl_retriever import ZeroRetriever
from opencompass.openicl.icl_inferencer import GenInferencer
from opencompass.datasets import (
    HFDataset,
    HumanEvaluator,
    humaneval_postprocess,
)

# Reader settings: the `prompt` column is the model input and `task_id` is
# declared as the output column. The `test` split is named as the train split.
# TODO: allow empty output-column
humaneval_reader_cfg = dict(
    input_columns=['prompt'],
    output_column='task_id',
    train_split='test',
)

# Inference settings: the template is the raw `{prompt}` field with nothing
# added around it, paired with ZeroRetriever and GenInferencer.
# NOTE(review): presumably this means zero-shot free-form generation --
# confirm against the retriever/inferencer implementations.
humaneval_infer_cfg = dict(
    prompt_template=dict(
        type=PromptTemplate,
        template='{prompt}',
    ),
    retriever=dict(type=ZeroRetriever),
    inferencer=dict(type=GenInferencer),
)

# Evaluation settings: predictions go through `humaneval_postprocess` and are
# scored by `HumanEvaluator`.
humaneval_eval_cfg = dict(
    evaluator=dict(type=HumanEvaluator),
    # the parameter only for humaneval
    # NOTE(review): presumably the k values for pass@k -- confirm in
    # HumanEvaluator.
    k=[1, 10, 100],
    pred_postprocessor=dict(type=humaneval_postprocess),
)

# Dataset entries declared by this config; a single HumanEval entry loaded
# through HFDataset from the `openai_humaneval` path.
humaneval_datasets = [
    dict(
        type=HFDataset,
        path='openai_humaneval',
        reader_cfg=humaneval_reader_cfg,
        infer_cfg=humaneval_infer_cfg,
        eval_cfg=humaneval_eval_cfg,
    ),
]