mirror of
https://github.com/open-compass/opencompass.git
synced 2025-05-30 16:03:24 +08:00

* add compass arena
* add compass_arena
* add compass arena
* Update opencompass/summarizers/subjective/compass_arena.py
  Co-authored-by: Songyang Zhang <tonysy@users.noreply.github.com>
* Update opencompass/summarizers/subjective/__init__.py
  Co-authored-by: Songyang Zhang <tonysy@users.noreply.github.com>
* Update opencompass/datasets/subjective/compass_arena.py
  Co-authored-by: Songyang Zhang <tonysy@users.noreply.github.com>
* Update opencompass/datasets/subjective/__init__.py
  Co-authored-by: Songyang Zhang <tonysy@users.noreply.github.com>
* Update configs/eval_subjective_compassarena.py
  Co-authored-by: Songyang Zhang <tonysy@users.noreply.github.com>
* Update configs/datasets/subjective/compassarena/compassarena_compare.py
  Co-authored-by: Songyang Zhang <tonysy@users.noreply.github.com>
* Update configs/eval_subjective_compassarena.py
  Co-authored-by: Songyang Zhang <tonysy@users.noreply.github.com>
* Update configs/datasets/subjective/compassarena/compassarena_compare.py
  Co-authored-by: Songyang Zhang <tonysy@users.noreply.github.com>
* fix check position bias
---------
Co-authored-by: Songyang Zhang <tonysy@users.noreply.github.com>
29 lines
866 B
Python
29 lines
866 B
Python
from datasets import Dataset
|
|
|
|
from opencompass.registry import LOAD_DATASET
|
|
|
|
from .subjective_cmp import SubjectiveCmpDataset
|
|
|
|
|
|
@LOAD_DATASET.register_module()
class CompassArenaDataset(SubjectiveCmpDataset):
    """Subjective comparison dataset that adds a ``ref`` field per record."""

    def load(
        self,
        path: str,
        name: str,
    ):
        """Load records through the parent loader and attach ``ref``.

        ``ref`` is copied from ``others['reference']`` when that key is
        present and its value is not ``None``; otherwise a fixed fallback
        string is used.

        Args:
            path: Forwarded unchanged to the parent ``load``.
            name: Forwarded unchanged to the parent ``load``.

        Returns:
            A ``Dataset`` built from the updated records.
        """
        # Single definition of the fallback used for both the "key missing"
        # and the "value is None" cases.
        fallback_ref = '满足用户需求,言之有理即可'

        records = []
        for record in super().load(path, name):
            others = record['others']
            has_reference = ('reference' in others
                             and others['reference'] is not None)
            record['ref'] = (others['reference']
                             if has_reference else fallback_ref)
            records.append(record)

        return Dataset.from_list(records)
|