diff --git a/configs/subjective_score.py b/configs/subjective_score.py index a79b8e59..ac1f0de5 100644 --- a/configs/subjective_score.py +++ b/configs/subjective_score.py @@ -49,7 +49,7 @@ _meta_template = dict( ) -judge_model = dict( +judge_model = dict( type=HuggingFaceCausalLM, abbr='qwen-7b-chat-hf', path="Qwen/Qwen-7B-Chat", @@ -85,6 +85,7 @@ eval = dict( max_num_workers=256, task=dict( type=SubjectiveEvalTask, + judge_cfg=judge_model )), ) work_dir = './creation/' diff --git a/opencompass/partitioners/sub_naive.py b/opencompass/partitioners/sub_naive.py index 6a6cf8bb..e21193b0 100644 --- a/opencompass/partitioners/sub_naive.py +++ b/opencompass/partitioners/sub_naive.py @@ -102,8 +102,9 @@ class SubjectiveNaivePartitioner(NaivePartitioner): else: models = self.get_model_combinations(models, base_models, compare_models) - return super().partition(models=models, - datasets=datasets, - work_dir=work_dir, - out_dir=out_dir, - add_cfg=add_cfg) + model_dataset_combinations = [{'models': models, 'datasets': datasets}] + return super().partition( + model_dataset_combinations=model_dataset_combinations, + work_dir=work_dir, + out_dir=out_dir, + add_cfg=add_cfg)