mirror of
https://github.com/open-compass/opencompass.git
synced 2025-05-30 16:03:24 +08:00
Update MathBench (#1176)
* Add Math Evaluation with Judge Model Evaluator * Add Math Evaluation with Judge Model Evaluator * Add Math Evaluation with Judge Model Evaluator * Add Math Evaluation with Judge Model Evaluator * Fix Llama-3 meta template * Fix MATH with JudgeLM Evaluation * Fix MATH with JudgeLM Evaluation * Fix MATH with JudgeLM Evaluation * Fix MATH with JudgeLM Evaluation * Update accelerator * Update MathBench --------- Co-authored-by: liuhongwei <liuhongwei@pjlab.org.cn>
This commit is contained in:
parent
2b3d4150f3
commit
1448be00e2
@ -91,7 +91,7 @@ for _split in list(mathbench_sets.keys()):
|
|||||||
),
|
),
|
||||||
),
|
),
|
||||||
retriever=dict(type=ZeroRetriever),
|
retriever=dict(type=ZeroRetriever),
|
||||||
inferencer=dict(type=GenInferencer, max_out_len=512),
|
inferencer=dict(type=GenInferencer, max_out_len=2048),
|
||||||
)
|
)
|
||||||
|
|
||||||
mathbench_eval_cfg = dict(
|
mathbench_eval_cfg = dict(
|
@ -1,4 +1,4 @@
|
|||||||
from mmengine.config import read_base
|
from mmengine.config import read_base
|
||||||
|
|
||||||
with read_base():
|
with read_base():
|
||||||
from .mathbench_2024_gen_649349 import mathbench_datasets # noqa: F401, F403
|
from .mathbench_2024_gen_19e486 import mathbench_datasets # noqa: F401, F403
|
||||||
|
Loading…
Reference in New Issue
Block a user