mirror of
https://github.com/open-compass/opencompass.git
synced 2025-05-30 16:03:24 +08:00
Add HLE dataset
This commit is contained in:
parent
34cc0a5f5f
commit
5a2462a26f
@ -399,6 +399,11 @@
|
|||||||
category: Math
|
category: Math
|
||||||
paper: https://proceedings.mlr.press/v202/gao23f/gao23f.pdf
|
paper: https://proceedings.mlr.press/v202/gao23f/gao23f.pdf
|
||||||
configpath: opencompass/configs/datasets/gsm_hard
|
configpath: opencompass/configs/datasets/gsm_hard
|
||||||
|
- hellaswag:
|
||||||
|
name: HLE
|
||||||
|
category: Reasoning
|
||||||
|
paper: https://lastexam.ai/paper
|
||||||
|
configpath: opencompass/configs/datasets/HLE
|
||||||
- hellaswag:
|
- hellaswag:
|
||||||
name: HellaSwag
|
name: HellaSwag
|
||||||
category: Reasoning
|
category: Reasoning
|
||||||
|
@ -1,4 +1,5 @@
|
|||||||
from mmengine.config import read_base
|
from mmengine.config import read_base
|
||||||
|
|
||||||
with read_base():
|
with read_base():
|
||||||
from .hle_llmjudge_gen_63a000 import hle_datasets # noqa: F401, F403
|
# Use an LLM as the judge by default
|
||||||
|
from .hle_llmverify_gen_6ff468 import hle_datasets # noqa: F401, F403
|
||||||
|
Loading…
Reference in New Issue
Block a user