2023-08-16 18:42:06 +08:00
|
|
|
from .advglue import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .afqmcd import * # noqa: F401, F403
|
|
|
|
from .agieval import * # noqa: F401, F403
|
2024-10-28 18:08:02 +08:00
|
|
|
from .aime2024 import * # noqa: F401, F403
|
2023-08-10 14:04:18 +08:00
|
|
|
from .anli import AnliDataset # noqa: F401, F403
|
2023-09-20 18:36:44 +08:00
|
|
|
from .anthropics_evals import * # noqa: F401, F403
|
2024-04-09 17:50:23 +08:00
|
|
|
from .apps import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .arc import * # noqa: F401, F403
|
2024-12-02 11:42:07 +08:00
|
|
|
from .arc_prize_public_evaluation import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .ax import * # noqa: F401, F403
|
2024-11-14 15:32:43 +08:00
|
|
|
from .babilong import * # noqa: F401, F403
|
2025-03-12 10:53:31 +08:00
|
|
|
from .bbeh import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .bbh import * # noqa: F401, F403
|
2024-12-05 19:30:43 +08:00
|
|
|
from .bigcodebench import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .boolq import * # noqa: F401, F403
|
|
|
|
from .bustum import * # noqa: F401, F403
|
|
|
|
from .c3 import * # noqa: F401, F403
|
2024-08-01 10:03:21 +08:00
|
|
|
from .calm import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .cb import * # noqa: F401, F403
|
|
|
|
from .ceval import * # noqa: F401, F403
|
2024-05-27 13:48:22 +08:00
|
|
|
from .charm import * # noqa: F401, F403
|
2024-04-12 08:46:26 +08:00
|
|
|
from .chembench import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .chid import * # noqa: F401, F403
|
2024-12-11 18:03:39 +08:00
|
|
|
from .chinese_simpleqa import * # noqa: F401, F403
|
2023-11-07 19:11:44 +08:00
|
|
|
from .cibench import * # noqa: F401, F403
|
2023-11-23 16:45:47 +08:00
|
|
|
from .circular import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .civilcomments import * # noqa: F401, F403
|
2023-11-09 22:05:25 +08:00
|
|
|
from .clozeTest_maxmin import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .cluewsc import * # noqa: F401, F403
|
2023-09-12 19:16:41 +08:00
|
|
|
from .cmb import * # noqa: F401, F403
|
2023-07-25 10:14:27 +08:00
|
|
|
from .cmmlu import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .cmnli import * # noqa: F401, F403
|
2024-10-28 18:08:02 +08:00
|
|
|
from .cmo_fib import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .cmrc import * # noqa: F401, F403
|
|
|
|
from .commonsenseqa import * # noqa: F401, F403
|
2023-11-30 15:33:02 +08:00
|
|
|
from .commonsenseqa_cn import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .copa import * # noqa: F401, F403
|
|
|
|
from .crowspairs import * # noqa: F401, F403
|
2023-11-30 15:33:02 +08:00
|
|
|
from .crowspairs_cn import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .csl import * # noqa: F401, F403
|
2023-12-25 21:59:16 +08:00
|
|
|
from .custom import * # noqa: F401, F403
|
2023-07-18 18:45:15 +08:00
|
|
|
from .cvalues import * # noqa: F401, F403
|
2024-09-29 19:24:58 +08:00
|
|
|
from .dingo import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .drcd import * # noqa: F401, F403
|
|
|
|
from .drop import * # noqa: F401, F403
|
2024-05-06 13:37:08 +08:00
|
|
|
from .drop_simple_eval import * # noqa: F401, F403
|
2023-09-15 12:50:27 +08:00
|
|
|
from .ds1000 import * # noqa: F401, F403
|
2023-11-07 19:11:44 +08:00
|
|
|
from .ds1000_interpreter import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .eprstmt import * # noqa: F401, F403
|
2023-11-16 17:47:57 +08:00
|
|
|
from .FinanceIQ import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .flores import * # noqa: F401, F403
|
2023-08-23 12:23:05 +08:00
|
|
|
from .game24 import * # noqa: F401, F403
|
2024-10-12 19:13:06 +08:00
|
|
|
from .gaokao_math import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .GaokaoBench import * # noqa: F401, F403
|
2024-12-05 19:30:43 +08:00
|
|
|
from .generic import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .govrepcrs import * # noqa: F401, F403
|
2024-01-01 15:54:40 +08:00
|
|
|
from .gpqa import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .gsm8k import * # noqa: F401, F403
|
2023-11-27 17:40:34 +08:00
|
|
|
from .gsm_hard import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .hellaswag import * # noqa: F401, F403
|
2025-03-04 16:42:37 +08:00
|
|
|
from .hle import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .huggingface import * # noqa: F401, F403
|
|
|
|
from .humaneval import * # noqa: F401, F403
|
[Feature] Support ModelScope datasets (#1289)
* add ceval, gsm8k modelscope support
* update race, mmlu, arc, cmmlu, commonsenseqa, humaneval and unittest
* update bbh, flores, obqa, siqa, storycloze, summedits, winogrande, xsum datasets
* format file
* format file
* update dataset format
* support ms_dataset
* update dataset for modelscope support
* merge myl_dev and update test_ms_dataset
* update dataset for modelscope support
* update readme
* update eval_api_zhipu_v2
* remove unused code
* add get_data_path function
* update readme
* remove tydiqa japanese subset
* add ceval, gsm8k modelscope support
* update race, mmlu, arc, cmmlu, commonsenseqa, humaneval and unittest
* update bbh, flores, obqa, siqa, storycloze, summedits, winogrande, xsum datasets
* format file
* format file
* update dataset format
* support ms_dataset
* update dataset for modelscope support
* merge myl_dev and update test_ms_dataset
* update readme
* update dataset for modelscope support
* update eval_api_zhipu_v2
* remove unused code
* add get_data_path function
* remove tydiqa japanese subset
* update util
* remove .DS_Store
* fix md format
* move util into package
* update docs/get_started.md
* restore eval_api_zhipu_v2.py, add environment setting
* Update dataset
* Update
* Update
* Update
* Update
---------
Co-authored-by: Yun lin <yunlin@U-Q9X2K4QV-1904.local>
Co-authored-by: Yunnglin <mao.looper@qq.com>
Co-authored-by: Yun lin <yunlin@laptop.local>
Co-authored-by: Yunnglin <maoyl@smail.nju.edu.cn>
Co-authored-by: zhangsongyang <zhangsongyang@pjlab.org.cn>
2024-07-29 13:48:32 +08:00
|
|
|
from .humaneval_multi import * # noqa: F401, F403
|
2023-08-17 11:03:16 +08:00
|
|
|
from .humanevalx import * # noqa: F401, F403
|
2024-01-08 22:07:24 +08:00
|
|
|
from .hungarian_math import * # noqa: F401, F403
|
2024-02-22 16:51:34 +08:00
|
|
|
from .IFEval.ifeval import IFEvalDataset, IFEvaluator # noqa: F401, F403
|
2024-07-22 17:59:30 +08:00
|
|
|
from .inference_ppl import InferencePPLDataset # noqa: F401, F403
|
2023-12-26 15:36:27 +08:00
|
|
|
from .infinitebench import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .iwslt2017 import * # noqa: F401, F403
|
|
|
|
from .jigsawmultilingual import * # noqa: F401, F403
|
2024-01-08 22:07:24 +08:00
|
|
|
from .jsonl import JsonlDataset # noqa: F401, F403
|
2023-09-22 18:46:33 +08:00
|
|
|
from .kaoshi import KaoshiDataset, KaoshiEvaluator # noqa: F401, F403
|
2024-11-25 20:11:27 +08:00
|
|
|
from .korbench import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .lambada import * # noqa: F401, F403
|
2023-10-13 19:51:36 +08:00
|
|
|
from .lawbench import * # noqa: F401, F403
|
2024-07-29 18:32:50 +08:00
|
|
|
from .LCBench import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .lcsts import * # noqa: F401, F403
|
2023-08-25 11:46:23 +08:00
|
|
|
from .leval import * # noqa: F401, F403
|
2024-10-21 20:50:39 +08:00
|
|
|
from .livecodebench import * # noqa: F401, F403
|
2024-12-05 19:30:43 +08:00
|
|
|
from .livemathbench import * # noqa: F401, F403
|
|
|
|
from .livereasonbench import * # noqa: F401, F403
|
2024-12-31 15:17:39 +08:00
|
|
|
from .livestembench import * # noqa: F401, F403
|
2024-04-30 10:51:01 +08:00
|
|
|
from .llm_compression import LLMCompressionDataset # noqa: F401, F403
|
2023-08-21 14:15:20 +08:00
|
|
|
from .longbench import * # noqa: F401, F403
|
2025-01-03 12:04:29 +08:00
|
|
|
from .longbenchv2 import * # noqa: F401, F403
|
2024-03-04 11:22:03 +08:00
|
|
|
from .lveval import * # noqa: F401, F403
|
2024-01-01 15:53:24 +08:00
|
|
|
from .mastermath2024v1 import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .math import * # noqa: F401, F403
|
2024-01-08 22:07:24 +08:00
|
|
|
from .math401 import * # noqa: F401, F403
|
2024-01-24 16:30:32 +08:00
|
|
|
from .math_intern import * # noqa: F401, F403
|
2023-10-18 17:08:31 +08:00
|
|
|
from .mathbench import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .mbpp import * # noqa: F401, F403
|
2023-12-09 16:05:46 +08:00
|
|
|
from .medbench import * # noqa: F401, F403
|
2024-05-06 15:29:34 +08:00
|
|
|
from .mgsm import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .mmlu import * # noqa: F401, F403
|
2025-01-09 14:11:20 +08:00
|
|
|
from .mmlu_cf import * # noqa: F401, F403
|
2024-06-28 14:16:34 +08:00
|
|
|
from .mmlu_pro import * # noqa: F401, F403
|
2024-05-08 15:13:18 +08:00
|
|
|
from .MMLUArabic import * # noqa: F401, F403
|
2024-10-17 19:09:34 +08:00
|
|
|
from .mmmlu import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .multirc import * # noqa: F401, F403
|
2024-11-14 20:42:12 +08:00
|
|
|
from .musr import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .narrativeqa import * # noqa: F401, F403
|
|
|
|
from .natural_question import * # noqa: F401, F403
|
2023-11-30 15:33:02 +08:00
|
|
|
from .natural_question_cn import * # noqa: F401, F403
|
2024-02-05 15:52:28 +08:00
|
|
|
from .NPHardEval import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .obqa import * # noqa: F401, F403
|
2025-01-24 10:00:01 +08:00
|
|
|
from .OlympiadBench import * # noqa: F401, F403
|
2024-02-29 12:55:07 +08:00
|
|
|
from .OpenFinData import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .piqa import * # noqa: F401, F403
|
2023-11-09 22:05:25 +08:00
|
|
|
from .py150 import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .qasper import * # noqa: F401, F403
|
|
|
|
from .qaspercut import * # noqa: F401, F403
|
2024-03-15 21:22:38 +08:00
|
|
|
from .QuALITY import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .race import * # noqa: F401, F403
|
|
|
|
from .realtoxicprompts import * # noqa: F401, F403
|
2023-12-20 17:57:42 +08:00
|
|
|
from .reasonbench import ReasonBenchDataset # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .record import * # noqa: F401, F403
|
2024-08-20 11:40:11 +08:00
|
|
|
from .ruler import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .safety import * # noqa: F401, F403
|
2023-09-22 17:42:08 +08:00
|
|
|
from .scibench import ScibenchDataset, scibench_postprocess # noqa: F401, F403
|
2024-08-22 13:42:25 +08:00
|
|
|
from .scicode import * # noqa: F401, F403
|
2024-11-28 19:16:07 +08:00
|
|
|
from .simpleqa import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .siqa import * # noqa: F401, F403
|
2023-08-10 14:04:18 +08:00
|
|
|
from .squad20 import SQuAD20Dataset, SQuAD20Evaluator # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .storycloze import * # noqa: F401, F403
|
|
|
|
from .strategyqa import * # noqa: F401, F403
|
2024-01-16 18:03:11 +08:00
|
|
|
from .subjective import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .summedits import * # noqa: F401, F403
|
|
|
|
from .summscreen import * # noqa: F401, F403
|
2025-03-11 19:32:08 +08:00
|
|
|
from .supergpqa import * # noqa: F401, F403
|
2023-11-22 14:54:39 +08:00
|
|
|
from .svamp import * # noqa: F401, F403
|
2023-11-03 11:15:46 +08:00
|
|
|
from .tabmwp import * # noqa: F401, F403
|
2024-04-09 17:50:23 +08:00
|
|
|
from .taco import * # noqa: F401, F403
|
2024-02-05 23:29:10 +08:00
|
|
|
from .teval import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .TheoremQA import * # noqa: F401, F403
|
|
|
|
from .tnews import * # noqa: F401, F403
|
|
|
|
from .triviaqa import * # noqa: F401, F403
|
|
|
|
from .triviaqarc import * # noqa: F401, F403
|
|
|
|
from .truthfulqa import * # noqa: F401, F403
|
2023-07-18 14:54:35 +08:00
|
|
|
from .tydiqa import * # noqa: F401, F403
|
2023-08-25 11:46:23 +08:00
|
|
|
from .wic import * # noqa: F401, F403
|
2023-12-01 14:56:54 +08:00
|
|
|
from .wikibench import * # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .winograd import * # noqa: F401, F403
|
|
|
|
from .winogrande import * # noqa: F401, F403
|
2023-09-15 15:06:53 +08:00
|
|
|
from .wnli import wnliDataset # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .wsc import * # noqa: F401, F403
|
|
|
|
from .xcopa import * # noqa: F401, F403
|
2023-08-10 14:04:18 +08:00
|
|
|
from .xiezhi import XiezhiDataset, XiezhiRetriever # noqa: F401, F403
|
2023-07-04 21:34:55 +08:00
|
|
|
from .xlsum import * # noqa: F401, F403
|
|
|
|
from .xsum import * # noqa: F401, F403
|