diff --git a/opencompass/configs/datasets/livemathbench/livemathbench_hard_gen_353ae7.py b/opencompass/configs/datasets/livemathbench/livemathbench_hard_gen_353ae7.py index e932d3c3..6b2f9f5a 100644 --- a/opencompass/configs/datasets/livemathbench/livemathbench_hard_gen_353ae7.py +++ b/opencompass/configs/datasets/livemathbench/livemathbench_hard_gen_353ae7.py @@ -9,7 +9,7 @@ livemathbench_dataset = dict( type=LiveMathBenchDataset, path='', k=16, - replication=3, + n=48, dataset_splits=['hard'], dataset_languages=['cn', 'en'], cot=True, @@ -37,13 +37,7 @@ livemathbench_dataset = dict( evaluator=dict( type=LiveMathBenchEvaluator, model_name='', - url=[], - use_extract_model=False, - extract_url=[], - extract_model_name='', - k=[4, 8, 16], - replication=3, - thresholds=[0.0, 0.25, 0.5, 0.75, 1.0] + url=[] ) ) ) diff --git a/opencompass/configs/datasets/livemathbench/livemathbench_hard_greedy_gen_353ae7.py b/opencompass/configs/datasets/livemathbench/livemathbench_hard_greedy_gen_353ae7.py index 830e55af..f956f83e 100644 --- a/opencompass/configs/datasets/livemathbench/livemathbench_hard_greedy_gen_353ae7.py +++ b/opencompass/configs/datasets/livemathbench/livemathbench_hard_greedy_gen_353ae7.py @@ -9,7 +9,7 @@ livemathbench_dataset = dict( type=LiveMathBenchDataset, path='', k=1, - replication=1, + n=1, dataset_splits=['hard'], dataset_languages=['cn', 'en'], cot=True, @@ -37,13 +37,7 @@ livemathbench_dataset = dict( evaluator=dict( type=LiveMathBenchEvaluator, model_name='', - url=[], - use_extract_model=False, - extract_url=[], - extract_model_name='', - k=[1], - replication=1, - thresholds=[0.0] + url=[] ) ) )