diff --git a/README.md b/README.md index 07dc610a..26a9fd4b 100644 --- a/README.md +++ b/README.md @@ -53,9 +53,7 @@ Just like a compass guides us on our journey, OpenCompass will guide you through 🔥🔥🔥 We are delighted to announce that **the OpenCompass has been recommended by the Meta AI**, click [Get Started](https://ai.meta.com/llama/get-started/#validation) of Llama for more information. > **Attention**
-> We launch the OpenCompass Collaboration project, welcome to support diverse evaluation benchmarks into OpenCompass! -> Clike [Issue](https://github.com/open-compass/opencompass/issues/248) for more information. -> Let's work together to build a more powerful OpenCompass toolkit! +> Breaking Change Notice: In version 0.4.0, we are consolidating all AMOTIC configuration files (previously located in ./configs/datasets, ./configs/models, and ./configs/summarizers) into the opencompass package. Users are advised to update their configuration references to reflect this structural change. ## 🚀 What's New diff --git a/README_zh-CN.md b/README_zh-CN.md index 8ac8cf3a..02f59284 100644 --- a/README_zh-CN.md +++ b/README_zh-CN.md @@ -53,9 +53,7 @@ 🔥🔥🔥 祝贺 **OpenCompass 作为大模型标准测试工具被Meta AI官方推荐**, 点击 Llama 的 [入门文档](https://ai.meta.com/llama/get-started/#validation) 获取更多信息。 > **注意**
-> 我们正式启动 OpenCompass 共建计划,诚邀社区用户为 OpenCompass 提供更具代表性和可信度的客观评测数据集! -> 点击 [Issue](https://github.com/open-compass/opencompass/issues/248) 获取更多数据集. -> 让我们携手共进,打造功能强大易用的大模型评测平台! +> 重要通知:从 v0.4.0 版本开始,所有位于 ./configs/datasets、./configs/models 和 ./configs/summarizers 目录下的 AMOTIC 配置文件将迁移至 opencompass 包中。请及时更新您的配置文件路径。 ## 🚀 最新进展 diff --git a/configs/datasets/GaokaoBench/GaokaoBench_gen_5cfe9e.py b/configs/datasets/GaokaoBench/GaokaoBench_gen_5cfe9e.py index 480eeadb..a1c7da8a 100644 --- a/configs/datasets/GaokaoBench/GaokaoBench_gen_5cfe9e.py +++ b/configs/datasets/GaokaoBench/GaokaoBench_gen_5cfe9e.py @@ -284,11 +284,12 @@ for _folder, _prompts in [ }, 'pred_role': 'BOT', } - _base_path = './data/GAOKAO-BENCH/data' + _base_path = 'opencompass/GAOKAO-BENCH' _dataset = { 'type': GaokaoBenchDataset, 'abbr': 'GaokaoBench_' + _p['keyword'], - 'path': _base_path + '/' + _folder + '/' + _p['keyword'] + '.json', + 'path': _base_path, + 'filename': '/' + _folder + '/' + _p['keyword'] + '.json', 'name': _p['keyword'], 'reader_cfg': _reader_cfg, 'infer_cfg': _infer_cfg, diff --git a/configs/datasets/GaokaoBench/GaokaoBench_mixed_9af5ee.py b/configs/datasets/GaokaoBench/GaokaoBench_mixed_9af5ee.py index 637f4f51..15b9f3dd 100644 --- a/configs/datasets/GaokaoBench/GaokaoBench_mixed_9af5ee.py +++ b/configs/datasets/GaokaoBench/GaokaoBench_mixed_9af5ee.py @@ -288,7 +288,8 @@ for _folder, _prompts in [ _dataset = { 'type': GaokaoBenchDataset, 'abbr': 'GaokaoBench_' + _p['keyword'], - 'path': _base_path + '/' + _folder + '/' + _p['keyword'] + '.json', + 'path': _base_path, + 'filename': '/' + _folder + '/' + _p['keyword'] + '.json', 'name': _p['keyword'], 'reader_cfg': _reader_cfg, 'infer_cfg': _infer_cfg, @@ -335,11 +336,12 @@ for _p in _MCQ_prompts: }, 'pred_role': 'BOT', } - _base_path = './data/GAOKAO-BENCH/data' + _base_path = 'opencompass/GAOKAO-BENCH' _dataset = { 'type': GaokaoBenchDataset, 'abbr': 'GaokaoBench_' + _p['keyword'], - 'path': _base_path + '/' + _folder + '/' + _p['keyword'] + '.json', + 'path': _base_path, + 'filename': '/' + _folder + '/' + _p['keyword'] + '.json', 'name': _p['keyword'], 'reader_cfg': _reader_cfg, 'infer_cfg': _infer_cfg, diff --git a/configs/datasets/GaokaoBench/GaokaoBench_no_subjective_gen_4c31db.py b/configs/datasets/GaokaoBench/GaokaoBench_no_subjective_gen_4c31db.py index e3c251aa..e1bbdf7e 100644 --- a/configs/datasets/GaokaoBench/GaokaoBench_no_subjective_gen_4c31db.py +++ b/configs/datasets/GaokaoBench/GaokaoBench_no_subjective_gen_4c31db.py @@ -31,10 +31,12 @@ for folder, prompts in [ 'evaluator': {'type': 'GaokaoBenchEvaluator' + '_' + p['type']}, 'pred_role': 'BOT', } + _base_path = 'opencompass/GAOKAO-BENCH' dataset = { 'type': GaokaoBenchDataset, 'abbr': 'GaokaoBench_' + p['keyword'], - 'path': os.path.join('data', 'GAOKAO-BENCH', 'data', folder, p['keyword'] + '.json'), + 'path': _base_path, + 'filename': '/' + folder + '/' + p['keyword'] + '.json', 'name': p['keyword'], 'reader_cfg': reader_cfg, 'infer_cfg': infer_cfg, diff --git a/configs/datasets/GaokaoBench/GaokaoBench_no_subjective_gen_d21e37.py b/configs/datasets/GaokaoBench/GaokaoBench_no_subjective_gen_d21e37.py index 1f50030b..a561af9a 100644 --- a/configs/datasets/GaokaoBench/GaokaoBench_no_subjective_gen_d21e37.py +++ b/configs/datasets/GaokaoBench/GaokaoBench_no_subjective_gen_d21e37.py @@ -30,10 +30,12 @@ for folder, prompts in [ 'evaluator': {'type': 'GaokaoBenchEvaluator' + '_' + p['type']}, 'pred_role': 'BOT', } + _base_path = 'opencompass/GAOKAO-BENCH' dataset = { 'type': GaokaoBenchDataset, 'abbr': 'GaokaoBench_' + p['keyword'], - 'path': os.path.join('data', 'GAOKAO-BENCH', 'data', folder, p['keyword'] + '.json'), + 'path': _base_path, + 'filename': '/' + folder + '/' + p['keyword'] + '.json', 'name': p['keyword'], 'reader_cfg': reader_cfg, 'infer_cfg': infer_cfg, diff --git a/configs/datasets/nq/nq_open_1shot_gen_01cf41.py b/configs/datasets/nq/nq_open_1shot_gen_01cf41.py index ef15e81e..db67906b 100644 --- a/configs/datasets/nq/nq_open_1shot_gen_01cf41.py +++ b/configs/datasets/nq/nq_open_1shot_gen_01cf41.py @@ -54,7 +54,7 @@ for k in [1]: dict( type=NQOpenDataset, abbr=f'nq_open_{k}shot', - path='./data/nq-open/', + path='opencompass/nq_open', reader_cfg=nq_reader_cfg, infer_cfg=nq_infer_cfg, eval_cfg=nq_eval_cfg) diff --git a/configs/datasets/nq/nq_open_1shot_gen_20a989.py b/configs/datasets/nq/nq_open_1shot_gen_20a989.py index 1df301f6..b1ac35ff 100644 --- a/configs/datasets/nq/nq_open_1shot_gen_20a989.py +++ b/configs/datasets/nq/nq_open_1shot_gen_20a989.py @@ -38,7 +38,7 @@ for k in [1]: dict( type=NQOpenDataset, abbr=f'nq_open_{k}shot', - path='./data/nq-open/', + path='opencompass/nq_open', reader_cfg=nq_reader_cfg, infer_cfg=nq_infer_cfg, eval_cfg=nq_eval_cfg) diff --git a/configs/datasets/nq/nq_open_1shot_gen_2e45e5.py b/configs/datasets/nq/nq_open_1shot_gen_2e45e5.py index d676b949..e877b397 100644 --- a/configs/datasets/nq/nq_open_1shot_gen_2e45e5.py +++ b/configs/datasets/nq/nq_open_1shot_gen_2e45e5.py @@ -54,7 +54,7 @@ for k in [1]: dict( type=NQOpenDataset, abbr=f'nq_open_{k}shot', - path='./data/nq-open/', + path='opencompass/nq_open', reader_cfg=nq_reader_cfg, infer_cfg=nq_infer_cfg, eval_cfg=nq_eval_cfg) diff --git a/configs/datasets/nq/nq_open_gen_e93f8a.py b/configs/datasets/nq/nq_open_gen_e93f8a.py index 224d9776..07d5b2a8 100644 --- a/configs/datasets/nq/nq_open_gen_e93f8a.py +++ b/configs/datasets/nq/nq_open_gen_e93f8a.py @@ -54,7 +54,7 @@ for k in [0, 1, 5, 25]: dict( type=NQOpenDataset, abbr=f'nq_open_{k}shot', - path='./data/nq-open/', + path='opencompass/nq_open', reader_cfg=nq_reader_cfg, infer_cfg=nq_infer_cfg, eval_cfg=nq_eval_cfg) diff --git a/configs/datasets/wikibench/wikibench_few_shot_ppl_c23d79.py b/configs/datasets/wikibench/wikibench_few_shot_ppl_c23d79.py index 0669bd7b..81056a4f 100644 --- a/configs/datasets/wikibench/wikibench_few_shot_ppl_c23d79.py +++ b/configs/datasets/wikibench/wikibench_few_shot_ppl_c23d79.py @@ -60,7 +60,8 @@ for _split in list(wikibench_sets.keys()): wikibench_datasets.append( dict( type=WikiBenchDataset, - path=f'./data/WikiBench/{_name}.jsonl', + path='opencompass/WikiBench', + filename=f'{_name}.jsonl', name='circular_' + _name if do_circular else _name, abbr='wikibench-' + _split + '-' + _name + 'circular' if do_circular else '', diff --git a/configs/datasets/wikibench/wikibench_gen_0978ad.py b/configs/datasets/wikibench/wikibench_gen_0978ad.py index 871133f9..73d35f19 100644 --- a/configs/datasets/wikibench/wikibench_gen_0978ad.py +++ b/configs/datasets/wikibench/wikibench_gen_0978ad.py @@ -43,7 +43,8 @@ for _split in list(wikibench_sets.keys()): wikibench_datasets.append( dict( type=WikiBenchDataset, - path=f'./data/WikiBench/{_name}.jsonl', + path='opencompass/WikiBench', + filename=f'{_name}.jsonl', name='circular_' + _name if do_circular else _name, abbr='wikibench-' + _split + '-' + _name + 'circular' if do_circular else '', reader_cfg=dict( diff --git a/configs/datasets/wikibench/wikibench_gen_f96ece.py b/configs/datasets/wikibench/wikibench_gen_f96ece.py index 5bf9d34e..80f03e5a 100644 --- a/configs/datasets/wikibench/wikibench_gen_f96ece.py +++ b/configs/datasets/wikibench/wikibench_gen_f96ece.py @@ -43,7 +43,8 @@ for _split in list(wikibench_sets.keys()): wikibench_datasets.append( dict( type=WikiBenchDataset, - path=f'./data/WikiBench/{_name}.jsonl', + path='opencompass/WikiBench', + filename=f'{_name}.jsonl', name='circular_' + _name if do_circular else _name, abbr='wikibench-' + _split + '-' + _name + 'circular' if do_circular else '', reader_cfg=dict( diff --git a/opencompass/__init__.py b/opencompass/__init__.py index bfeb9e74..6e384829 100644 --- a/opencompass/__init__.py +++ b/opencompass/__init__.py @@ -1 +1,17 @@ __version__ = '0.3.4' + + +def _warn_about_config_migration(): + import warnings + warnings.warn( + 'Starting from v0.4.0, all AMOTIC configuration files currently ' + 'located in `./configs/datasets`, `./configs/models`, and ' + '`./configs/summarizers` will be migrated to the ' + '`opencompass/configs/` package. Please update your configuration ' + 'file paths accordingly.', + UserWarning, # Changed to UserWarning + stacklevel=2) + + +# Trigger the warning +_warn_about_config_migration() diff --git a/opencompass/configs/datasets/GaokaoBench/GaokaoBench_gen_5cfe9e.py b/opencompass/configs/datasets/GaokaoBench/GaokaoBench_gen_5cfe9e.py index 480eeadb..a1c7da8a 100644 --- a/opencompass/configs/datasets/GaokaoBench/GaokaoBench_gen_5cfe9e.py +++ b/opencompass/configs/datasets/GaokaoBench/GaokaoBench_gen_5cfe9e.py @@ -284,11 +284,12 @@ for _folder, _prompts in [ }, 'pred_role': 'BOT', } - _base_path = './data/GAOKAO-BENCH/data' + _base_path = 'opencompass/GAOKAO-BENCH' _dataset = { 'type': GaokaoBenchDataset, 'abbr': 'GaokaoBench_' + _p['keyword'], - 'path': _base_path + '/' + _folder + '/' + _p['keyword'] + '.json', + 'path': _base_path, + 'filename': '/' + _folder + '/' + _p['keyword'] + '.json', 'name': _p['keyword'], 'reader_cfg': _reader_cfg, 'infer_cfg': _infer_cfg, diff --git a/opencompass/configs/datasets/GaokaoBench/GaokaoBench_mixed_9af5ee.py b/opencompass/configs/datasets/GaokaoBench/GaokaoBench_mixed_9af5ee.py index 637f4f51..15b9f3dd 100644 --- a/opencompass/configs/datasets/GaokaoBench/GaokaoBench_mixed_9af5ee.py +++ b/opencompass/configs/datasets/GaokaoBench/GaokaoBench_mixed_9af5ee.py @@ -288,7 +288,8 @@ for _folder, _prompts in [ _dataset = { 'type': GaokaoBenchDataset, 'abbr': 'GaokaoBench_' + _p['keyword'], - 'path': _base_path + '/' + _folder + '/' + _p['keyword'] + '.json', + 'path': _base_path, + 'filename': '/' + _folder + '/' + _p['keyword'] + '.json', 'name': _p['keyword'], 'reader_cfg': _reader_cfg, 'infer_cfg': _infer_cfg, @@ -335,11 +336,12 @@ for _p in _MCQ_prompts: }, 'pred_role': 'BOT', } - _base_path = './data/GAOKAO-BENCH/data' + _base_path = 'opencompass/GAOKAO-BENCH' _dataset = { 'type': GaokaoBenchDataset, 'abbr': 'GaokaoBench_' + _p['keyword'], - 'path': _base_path + '/' + _folder + '/' + _p['keyword'] + '.json', + 'path': _base_path, + 'filename': '/' + _folder + '/' + _p['keyword'] + '.json', 'name': _p['keyword'], 'reader_cfg': _reader_cfg, 'infer_cfg': _infer_cfg, diff --git a/opencompass/configs/datasets/GaokaoBench/GaokaoBench_no_subjective_gen_4c31db.py b/opencompass/configs/datasets/GaokaoBench/GaokaoBench_no_subjective_gen_4c31db.py index e3c251aa..e1bbdf7e 100644 --- a/opencompass/configs/datasets/GaokaoBench/GaokaoBench_no_subjective_gen_4c31db.py +++ b/opencompass/configs/datasets/GaokaoBench/GaokaoBench_no_subjective_gen_4c31db.py @@ -31,10 +31,12 @@ for folder, prompts in [ 'evaluator': {'type': 'GaokaoBenchEvaluator' + '_' + p['type']}, 'pred_role': 'BOT', } + _base_path = 'opencompass/GAOKAO-BENCH' dataset = { 'type': GaokaoBenchDataset, 'abbr': 'GaokaoBench_' + p['keyword'], - 'path': os.path.join('data', 'GAOKAO-BENCH', 'data', folder, p['keyword'] + '.json'), + 'path': _base_path, + 'filename': '/' + folder + '/' + p['keyword'] + '.json', 'name': p['keyword'], 'reader_cfg': reader_cfg, 'infer_cfg': infer_cfg, diff --git a/opencompass/configs/datasets/GaokaoBench/GaokaoBench_no_subjective_gen_d21e37.py b/opencompass/configs/datasets/GaokaoBench/GaokaoBench_no_subjective_gen_d21e37.py index 1f50030b..a561af9a 100644 --- a/opencompass/configs/datasets/GaokaoBench/GaokaoBench_no_subjective_gen_d21e37.py +++ b/opencompass/configs/datasets/GaokaoBench/GaokaoBench_no_subjective_gen_d21e37.py @@ -30,10 +30,12 @@ for folder, prompts in [ 'evaluator': {'type': 'GaokaoBenchEvaluator' + '_' + p['type']}, 'pred_role': 'BOT', } + _base_path = 'opencompass/GAOKAO-BENCH' dataset = { 'type': GaokaoBenchDataset, 'abbr': 'GaokaoBench_' + p['keyword'], - 'path': os.path.join('data', 'GAOKAO-BENCH', 'data', folder, p['keyword'] + '.json'), + 'path': _base_path, + 'filename': '/' + folder + '/' + p['keyword'] + '.json', 'name': p['keyword'], 'reader_cfg': reader_cfg, 'infer_cfg': infer_cfg, diff --git a/opencompass/configs/datasets/nq/nq_open_1shot_gen_01cf41.py b/opencompass/configs/datasets/nq/nq_open_1shot_gen_01cf41.py index ef15e81e..db67906b 100644 --- a/opencompass/configs/datasets/nq/nq_open_1shot_gen_01cf41.py +++ b/opencompass/configs/datasets/nq/nq_open_1shot_gen_01cf41.py @@ -54,7 +54,7 @@ for k in [1]: dict( type=NQOpenDataset, abbr=f'nq_open_{k}shot', - path='./data/nq-open/', + path='opencompass/nq_open', reader_cfg=nq_reader_cfg, infer_cfg=nq_infer_cfg, eval_cfg=nq_eval_cfg) diff --git a/opencompass/configs/datasets/nq/nq_open_1shot_gen_20a989.py b/opencompass/configs/datasets/nq/nq_open_1shot_gen_20a989.py index 1df301f6..b1ac35ff 100644 --- a/opencompass/configs/datasets/nq/nq_open_1shot_gen_20a989.py +++ b/opencompass/configs/datasets/nq/nq_open_1shot_gen_20a989.py @@ -38,7 +38,7 @@ for k in [1]: dict( type=NQOpenDataset, abbr=f'nq_open_{k}shot', - path='./data/nq-open/', + path='opencompass/nq_open', reader_cfg=nq_reader_cfg, infer_cfg=nq_infer_cfg, eval_cfg=nq_eval_cfg) diff --git a/opencompass/configs/datasets/nq/nq_open_1shot_gen_2e45e5.py b/opencompass/configs/datasets/nq/nq_open_1shot_gen_2e45e5.py index d676b949..e877b397 100644 --- a/opencompass/configs/datasets/nq/nq_open_1shot_gen_2e45e5.py +++ b/opencompass/configs/datasets/nq/nq_open_1shot_gen_2e45e5.py @@ -54,7 +54,7 @@ for k in [1]: dict( type=NQOpenDataset, abbr=f'nq_open_{k}shot', - path='./data/nq-open/', + path='opencompass/nq_open', reader_cfg=nq_reader_cfg, infer_cfg=nq_infer_cfg, eval_cfg=nq_eval_cfg) diff --git a/opencompass/configs/datasets/nq/nq_open_gen_e93f8a.py b/opencompass/configs/datasets/nq/nq_open_gen_e93f8a.py index 224d9776..07d5b2a8 100644 --- a/opencompass/configs/datasets/nq/nq_open_gen_e93f8a.py +++ b/opencompass/configs/datasets/nq/nq_open_gen_e93f8a.py @@ -54,7 +54,7 @@ for k in [0, 1, 5, 25]: dict( type=NQOpenDataset, abbr=f'nq_open_{k}shot', - path='./data/nq-open/', + path='opencompass/nq_open', reader_cfg=nq_reader_cfg, infer_cfg=nq_infer_cfg, eval_cfg=nq_eval_cfg) diff --git a/opencompass/configs/datasets/wikibench/wikibench_few_shot_ppl_c23d79.py b/opencompass/configs/datasets/wikibench/wikibench_few_shot_ppl_c23d79.py index 0669bd7b..81056a4f 100644 --- a/opencompass/configs/datasets/wikibench/wikibench_few_shot_ppl_c23d79.py +++ b/opencompass/configs/datasets/wikibench/wikibench_few_shot_ppl_c23d79.py @@ -60,7 +60,8 @@ for _split in list(wikibench_sets.keys()): wikibench_datasets.append( dict( type=WikiBenchDataset, - path=f'./data/WikiBench/{_name}.jsonl', + path='opencompass/WikiBench', + filename=f'{_name}.jsonl', name='circular_' + _name if do_circular else _name, abbr='wikibench-' + _split + '-' + _name + 'circular' if do_circular else '', diff --git a/opencompass/configs/datasets/wikibench/wikibench_gen_0978ad.py b/opencompass/configs/datasets/wikibench/wikibench_gen_0978ad.py index 871133f9..73d35f19 100644 --- a/opencompass/configs/datasets/wikibench/wikibench_gen_0978ad.py +++ b/opencompass/configs/datasets/wikibench/wikibench_gen_0978ad.py @@ -43,7 +43,8 @@ for _split in list(wikibench_sets.keys()): wikibench_datasets.append( dict( type=WikiBenchDataset, - path=f'./data/WikiBench/{_name}.jsonl', + path='opencompass/WikiBench', + filename=f'{_name}.jsonl', name='circular_' + _name if do_circular else _name, abbr='wikibench-' + _split + '-' + _name + 'circular' if do_circular else '', reader_cfg=dict( diff --git a/opencompass/configs/datasets/wikibench/wikibench_gen_f96ece.py b/opencompass/configs/datasets/wikibench/wikibench_gen_f96ece.py index 5bf9d34e..80f03e5a 100644 --- a/opencompass/configs/datasets/wikibench/wikibench_gen_f96ece.py +++ b/opencompass/configs/datasets/wikibench/wikibench_gen_f96ece.py @@ -43,7 +43,8 @@ for _split in list(wikibench_sets.keys()): wikibench_datasets.append( dict( type=WikiBenchDataset, - path=f'./data/WikiBench/{_name}.jsonl', + path='opencompass/WikiBench', + filename=f'{_name}.jsonl', name='circular_' + _name if do_circular else _name, abbr='wikibench-' + _split + '-' + _name + 'circular' if do_circular else '', reader_cfg=dict( diff --git a/opencompass/datasets/GaokaoBench.py b/opencompass/datasets/GaokaoBench.py index d3cd31a0..c1ae6d10 100644 --- a/opencompass/datasets/GaokaoBench.py +++ b/opencompass/datasets/GaokaoBench.py @@ -15,8 +15,10 @@ from .base import BaseDataset class GaokaoBenchDataset(BaseDataset): @staticmethod - def load(path: str, name: str): - path = get_data_path(path, local_mode=True) + def load(path: str, filename: str, name: str): + path = get_data_path(path) + path = path + filename + if environ.get('DATASET_SOURCE') == 'ModelScope': from modelscope import MsDataset return MsDataset.load(path, subset_name=name, split='test') diff --git a/opencompass/datasets/natural_question.py b/opencompass/datasets/natural_question.py index ab8356cd..e1ca1632 100644 --- a/opencompass/datasets/natural_question.py +++ b/opencompass/datasets/natural_question.py @@ -55,7 +55,7 @@ class NQOpenDataset(BaseDataset): @staticmethod def load(path: str): - path = get_data_path(path, local_mode=True) + path = get_data_path(path) dataset = DatasetDict() for split in ['validation', 'train']: filename = osp.join(path, f'nq-open-{split}.jsonl') diff --git a/opencompass/datasets/wikibench.py b/opencompass/datasets/wikibench.py index 9e0e5743..e2309999 100644 --- a/opencompass/datasets/wikibench.py +++ b/opencompass/datasets/wikibench.py @@ -21,8 +21,9 @@ def get_number(options): class WikiBenchDataset(BaseDataset): @staticmethod - def load(path: str, name: str): - path = get_data_path(path, local_mode=True) + def load(path: str, filename: str, name: str): + path = get_data_path(path) + path = path + filename circular_patterns = ['ABCD', 'BCDA', 'CDAB', 'DABC'] diff --git a/opencompass/utils/datasets_info.py b/opencompass/utils/datasets_info.py index 06555925..c877adf9 100644 --- a/opencompass/utils/datasets_info.py +++ b/opencompass/utils/datasets_info.py @@ -301,6 +301,21 @@ DATASETS_MAPPING = { "ms_id": "", "hf_id": "", "local": "./data/cmo.jsonl", + }, + "opencompass/nq_open": { + "ms_id": "", + "hf_id": "", + "local": "./data/nq-open/", + }, + "opencompass/GAOKAO-BENCH": { + "ms_id": "", + "hf_id": "", + "local": "./data/GAOKAO-BENCH/data", + }, + "opencompass/WikiBench": { + "ms_id": "", + "hf_id": "", + "local": "./data/WikiBench/", } } @@ -472,5 +487,25 @@ DATASETS_URL = { "/cmo": { "url": "http://opencompass.oss-cn-shanghai.aliyuncs.com/datasets/data/cmo.zip", "md5": "fad52c81290506a8ca74f46b5400d8fc" + }, + "/nq-open": { + "url": "http://opencompass.oss-cn-shanghai.aliyuncs.com/datasets/data/nq-open.zip", + "md5": "a340521e5c9ec591227dcb367f718b25", + }, + "/winogrande": { + "url": "http://opencompass.oss-cn-shanghai.aliyuncs.com/datasets/data/winogrande.zip", + "md5": "9e949a75eacc26ed4fd2b9aa870b495b", + }, + "/triviaqa": { + "url": "http://opencompass.oss-cn-shanghai.aliyuncs.com/datasets/data/triviaqa.zip", + "md5": "e6a118d744236814926b2ec7ec66c034", + }, + "/GAOKAO-BENCH": { + "url": "http://opencompass.oss-cn-shanghai.aliyuncs.com/datasets/data/GAOKAO-BENCH.zip", + "md5": "ba3c71b8b9db96d2a0664b977c4f9784", + }, + "/WikiBench": { + "url": "http://opencompass.oss-cn-shanghai.aliyuncs.com/datasets/data/WikiBench.zip", + "md5": "6dac1d1a3133fe1effff185cbf71d928", } }