OpenCompass/configs/subjective/eval_subjective_compassarena.py
bittersweet1999 054e9fa7e5
[Feature] add one script for subjective (#993)
* add one script for subjective

* add one script for subjective

* add one script for subjective

* add one script for subjective

---------

Co-authored-by: thebestannie <1290646445@qq.com>
2024-03-20 23:20:41 +08:00

29 lines
913 B
Python

from os import getenv as gv
from opencompass.models import HuggingFaceCausalLM
from mmengine.config import read_base
# Pull variables in from sibling/base config files. These are relative
# imports of config modules, so they have to live in the body of mmengine's
# ``read_base()`` context manager (i.e. be indented under the ``with``).
# NOTE(review): ``judge_model`` and ``infer`` are not referenced further down
# in this file; presumably they are imported so they become part of the
# resulting config -- confirm before pruning.
with read_base():
    from ..datasets.subjective.compassarena.compassarena_compare import subjective_datasets
    from .model_cfg import models, judge_model, given_pred, infer, gpt4, runner
from opencompass.partitioners.sub_naive import SubjectiveNaivePartitioner
from opencompass.partitioners.sub_size import SubjectiveSizePartitioner
from opencompass.summarizers import CompassArenaSummarizer
# Datasets for this run: a new list holding every entry of the
# ``subjective_datasets`` collection imported from the base config.
datasets = list(subjective_datasets)

# Evaluation-stage settings.
# NOTE(review): the name ``eval`` shadows the Python builtin; it is presumably
# the key the framework reads from this config, so it is kept unchanged.
eval = dict(
    partitioner=dict(
        type=SubjectiveSizePartitioner,
        strategy='split',
        max_task_size=10000,
        # NOTE(review): 'm2n' presumably pairs every base model with every
        # compare model -- confirm against the partitioner implementation.
        mode='m2n',
        base_models=[gpt4],
        compare_models=models,
    ),
    runner=runner,
    given_pred=given_pred,
)

# Directory passed to the framework as ``work_dir``.
work_dir = 'outputs/compass_arena/'

# Summarizer configuration; the meaning of 'half_add' is defined by
# CompassArenaSummarizer and is not visible from this file.
summarizer = dict(
    type=CompassArenaSummarizer,
    summary_type='half_add',
)