2024-10-28 18:08:02 +08:00
|
|
|
import json
|
|
|
|
|
|
|
|
from datasets import Dataset
|
|
|
|
|
|
|
|
from opencompass.registry import LOAD_DATASET
|
|
|
|
from opencompass.utils import get_data_path
|
|
|
|
|
|
|
|
from .base import BaseDataset
|
|
|
|
|
|
|
|
|
|
|
|
@LOAD_DATASET.register_module()
class Aime2024Dataset(BaseDataset):
    """Dataset loader that reads a JSON-lines file of prompt/answer records."""

    @staticmethod
    def load(path, **kwargs):
        """Read a JSON-lines file and return its records as a ``Dataset``.

        Every non-blank line is parsed as one JSON object. Each object is
        kept as-is and gains two extra keys: ``question`` (the value of
        ``origin_prompt``) and ``answer`` (the value of ``gold_answer``).

        Args:
            path: Dataset location; resolved through ``get_data_path``
                before the file is opened.
            **kwargs: Accepted for interface compatibility; not used here.

        Returns:
            The result of ``Dataset.from_list`` over the parsed records,
            in file order.

        Raises:
            KeyError: If a record lacks ``origin_prompt`` or
                ``gold_answer``.
            json.JSONDecodeError: If a non-blank line is not valid JSON.
        """
        path = get_data_path(path)
        dataset = []
        # Decode explicitly as UTF-8 so the result does not depend on the
        # platform's default locale encoding.
        with open(path, 'r', encoding='utf-8') as f:
            for line in f:
                # Tolerate blank lines (e.g. a trailing newline at EOF),
                # which json.loads would otherwise reject.
                if not line.strip():
                    continue
                record = json.loads(line)
                record['question'] = record['origin_prompt']
                record['answer'] = record['gold_answer']
                dataset.append(record)
        return Dataset.from_list(dataset)
|