mirror of
https://github.com/open-compass/opencompass.git
synced 2025-05-30 16:03:24 +08:00
[Update] Update dataset configs (#2030)
* [Update] Update dataset configs * Fix lint
This commit is contained in:
parent
c69110361b
commit
455bb05d1b
@ -86,7 +86,7 @@ for _name in chembench_all_sets:
|
||||
),
|
||||
dataset_cfg=dict(
|
||||
type=ChemBenchDataset,
|
||||
path='/fs-computility/llm/xiaolinchen/opencompass_fork/data/ChemBench4K',
|
||||
path='opencompass/ChemBench4K',
|
||||
name=_name,
|
||||
reader_cfg=chembench_reader_cfg,
|
||||
),
|
||||
|
@ -33,7 +33,12 @@ def extract_theoremqa_answer(pred: str, answer_flag: bool = True):
|
||||
try:
|
||||
with time_limit(1):
|
||||
tmp = str(latex2sympy(pred))
|
||||
pred = str(eval(tmp))
|
||||
pred = eval(tmp)
|
||||
if isinstance(pred, tuple):
|
||||
pred = str(list(pred))
|
||||
else:
|
||||
pred = str(pred)
|
||||
|
||||
except Exception:
|
||||
if re.match(r'-?[\d\.]+\s\D+$', pred):
|
||||
pred = pred.split(' ')[0]
|
||||
|
@ -14,6 +14,7 @@ from opencompass.utils import get_data_path
|
||||
|
||||
from ..base import BaseDataset
|
||||
|
||||
|
||||
@LOAD_DATASET.register_module()
|
||||
class RewardBenchDataset(BaseDataset):
|
||||
|
||||
|
@ -4,6 +4,7 @@ from collections import defaultdict
|
||||
|
||||
import numpy as np
|
||||
from datasets import Dataset, DatasetDict, load_dataset
|
||||
from nltk.translate.meteor_score import meteor_score
|
||||
|
||||
from opencompass.openicl.icl_evaluator.icl_base_evaluator import BaseEvaluator
|
||||
from opencompass.registry import (ICL_EVALUATORS, LOAD_DATASET,
|
||||
|
Loading…
Reference in New Issue
Block a user