mirror of
https://github.com/open-compass/opencompass.git
synced 2025-05-30 16:03:24 +08:00
hle biomed test
This commit is contained in:
parent
e8bc8c1e8c
commit
12597edea6
@ -3,7 +3,7 @@ from opencompass.openicl.icl_retriever import ZeroRetriever
|
|||||||
from opencompass.openicl.icl_inferencer import GenInferencer
|
from opencompass.openicl.icl_inferencer import GenInferencer
|
||||||
from opencompass.evaluator import GenericLLMEvaluator
|
from opencompass.evaluator import GenericLLMEvaluator
|
||||||
from opencompass.datasets import generic_llmjudge_postprocess
|
from opencompass.datasets import generic_llmjudge_postprocess
|
||||||
from opencompass.datasets import HLEDataset
|
from opencompass.datasets import HLEDataset_Bio_Med
|
||||||
|
|
||||||
# ----------------------------- Detailed Config -----------------------------
|
# ----------------------------- Detailed Config -----------------------------
|
||||||
|
|
||||||
@ -68,7 +68,7 @@ math_eval_cfg = dict(
|
|||||||
]),
|
]),
|
||||||
),
|
),
|
||||||
dataset_cfg=dict(
|
dataset_cfg=dict(
|
||||||
type=HLEDataset,
|
type=HLEDataset_Bio_Med,
|
||||||
path='cais/hle',
|
path='cais/hle',
|
||||||
reader_cfg=math_reader_cfg,
|
reader_cfg=math_reader_cfg,
|
||||||
),
|
),
|
||||||
@ -81,7 +81,7 @@ math_eval_cfg = dict(
|
|||||||
|
|
||||||
hle_datasets = [
|
hle_datasets = [
|
||||||
dict(
|
dict(
|
||||||
type=HLEDataset,
|
type=HLEDataset_Bio_Med,
|
||||||
abbr='hle_llmjudge',
|
abbr='hle_llmjudge',
|
||||||
path='cais/hle',
|
path='cais/hle',
|
||||||
reader_cfg=math_reader_cfg,
|
reader_cfg=math_reader_cfg,
|
||||||
|
@ -15,3 +15,17 @@ class HLEDataset(BaseDataset):
|
|||||||
dataset['test'] = dataset['test'].rename_column('question', 'problem')
|
dataset['test'] = dataset['test'].rename_column('question', 'problem')
|
||||||
dataset['train'] = dataset['test']
|
dataset['train'] = dataset['test']
|
||||||
return dataset
|
return dataset
|
||||||
|
|
||||||
|
|
||||||
|
@LOAD_DATASET.register_module()
class HLEDataset_Bio_Med(BaseDataset):
    """HLE dataset restricted to a single subject category.

    Only rows of the ``test`` split whose ``image`` field is the empty
    string and whose ``category`` field equals the requested category are
    kept (an empty ``image`` presumably marks a question with no attached
    image -- confirm against the dataset card).
    """

    @staticmethod
    def load(path: str, category: str = 'Biology/Medicine'):
        """Load the dataset at ``path`` and keep one category of its test split.

        Args:
            path: Dataset identifier or location handed to ``load_dataset``.
            category: Value the ``category`` column must equal for a row to
                be kept. Defaults to ``'Biology/Medicine'``.

        Returns:
            The object returned by ``load_dataset`` with its ``test`` split
            filtered, its ``question`` column renamed to ``problem``, and
            its ``train`` entry pointing at that same filtered split.
        """
        dataset = load_dataset(path)

        def _keep(row):
            # Both conditions are checked in one pass so the split is only
            # traversed once instead of once per condition.
            return row['image'] == '' and row['category'] == category

        test_split = dataset['test'].filter(_keep)
        test_split = test_split.rename_column('question', 'problem')

        dataset['test'] = test_split
        # The test split is also exposed under the 'train' key.
        dataset['train'] = test_split
        return dataset
|
||||||
|
Loading…
Reference in New Issue
Block a user