OpenCompass/opencompass/datasets/longbench/longbench_vcsum.py
2024-09-06 15:50:12 +08:00

27 lines
855 B
Python

from datasets import Dataset, load_dataset
from opencompass.registry import LOAD_DATASET
from opencompass.utils import get_data_path
from ..base import BaseDataset
@LOAD_DATASET.register_module()
class LongBenchvcsumDataset(BaseDataset):
    """Dataset loader registered in ``LOAD_DATASET`` for LongBench vcsum.

    The loader keeps only the ``context`` and ``answers`` fields of every
    record in the ``test`` split; any other columns are dropped.
    """

    @staticmethod
    def load(path: str, name: str):
        """Load the dataset and reduce its ``test`` split to two fields.

        Args:
            path: Dataset location. It is passed through ``get_data_path``
                first and the result is used both as the ``path`` and the
                ``data_dir`` argument of ``load_dataset``.
            name: Configuration name forwarded to ``load_dataset``.

        Returns:
            The object returned by ``load_dataset`` with its ``'test'``
            entry replaced by a ``Dataset`` built from dicts that hold
            only the ``context`` and ``answers`` keys.
        """
        # NOTE(review): presumably resolves a dataset id / relative path to
        # a local directory -- confirm against opencompass.utils.
        path = get_data_path(path)
        # NOTE(review): trust_remote_code=True lets the loading script
        # shipped with the dataset execute; only point this at trusted data.
        dataset = load_dataset(path=path,
                               name=name,
                               data_dir=path,
                               trust_remote_code=True)
        split = 'test'
        # Walk the rows once. Indexing ``dataset[split][column][i]`` inside
        # a ``range(len(...))`` loop re-fetches the column for every row,
        # which makes the conversion quadratic in the number of rows.
        raw_data = [{
            'context': row['context'],
            'answers': row['answers'],
        } for row in dataset[split]]
        dataset[split] = Dataset.from_list(raw_data)
        return dataset