Mirror of https://github.com/open-compass/opencompass.git (synced 2025-05-30 16:03:24 +08:00)
[Update] Update dataset configs (#2030)
* [Update] Update dataset configs
* Fix lint
This commit is contained in:
Parent: c69110361b
Commit: 455bb05d1b
@ -86,7 +86,7 @@ for _name in chembench_all_sets:
|
|||||||
),
|
),
|
||||||
dataset_cfg=dict(
|
dataset_cfg=dict(
|
||||||
type=ChemBenchDataset,
|
type=ChemBenchDataset,
|
||||||
path='/fs-computility/llm/xiaolinchen/opencompass_fork/data/ChemBench4K',
|
path='opencompass/ChemBench4K',
|
||||||
name=_name,
|
name=_name,
|
||||||
reader_cfg=chembench_reader_cfg,
|
reader_cfg=chembench_reader_cfg,
|
||||||
),
|
),
|
||||||
|
@ -33,7 +33,12 @@ def extract_theoremqa_answer(pred: str, answer_flag: bool = True):
|
|||||||
try:
|
try:
|
||||||
with time_limit(1):
|
with time_limit(1):
|
||||||
tmp = str(latex2sympy(pred))
|
tmp = str(latex2sympy(pred))
|
||||||
pred = str(eval(tmp))
|
pred = eval(tmp)
|
||||||
|
if isinstance(pred, tuple):
|
||||||
|
pred = str(list(pred))
|
||||||
|
else:
|
||||||
|
pred = str(pred)
|
||||||
|
|
||||||
except Exception:
|
except Exception:
|
||||||
if re.match(r'-?[\d\.]+\s\D+$', pred):
|
if re.match(r'-?[\d\.]+\s\D+$', pred):
|
||||||
pred = pred.split(' ')[0]
|
pred = pred.split(' ')[0]
|
||||||
|
@ -14,6 +14,7 @@ from opencompass.utils import get_data_path
|
|||||||
|
|
||||||
from ..base import BaseDataset
|
from ..base import BaseDataset
|
||||||
|
|
||||||
|
|
||||||
@LOAD_DATASET.register_module()
|
@LOAD_DATASET.register_module()
|
||||||
class RewardBenchDataset(BaseDataset):
|
class RewardBenchDataset(BaseDataset):
|
||||||
|
|
||||||
|
@ -4,6 +4,7 @@ from collections import defaultdict
|
|||||||
|
|
||||||
import numpy as np
|
import numpy as np
|
||||||
from datasets import Dataset, DatasetDict, load_dataset
|
from datasets import Dataset, DatasetDict, load_dataset
|
||||||
|
from nltk.translate.meteor_score import meteor_score
|
||||||
|
|
||||||
from opencompass.openicl.icl_evaluator.icl_base_evaluator import BaseEvaluator
|
from opencompass.openicl.icl_evaluator.icl_base_evaluator import BaseEvaluator
|
||||||
from opencompass.registry import (ICL_EVALUATORS, LOAD_DATASET,
|
from opencompass.registry import (ICL_EVALUATORS, LOAD_DATASET,
|
||||||
|
Loading…
Reference in New Issue
Block a user