hle biomed test

This commit is contained in:
Flaick 2025-04-25 10:09:33 +00:00
parent e8bc8c1e8c
commit 12597edea6
2 changed files with 17 additions and 3 deletions

View File

@ -3,7 +3,7 @@ from opencompass.openicl.icl_retriever import ZeroRetriever
from opencompass.openicl.icl_inferencer import GenInferencer from opencompass.openicl.icl_inferencer import GenInferencer
from opencompass.evaluator import GenericLLMEvaluator from opencompass.evaluator import GenericLLMEvaluator
from opencompass.datasets import generic_llmjudge_postprocess from opencompass.datasets import generic_llmjudge_postprocess
from opencompass.datasets import HLEDataset from opencompass.datasets import HLEDataset_Bio_Med
# ----------------------------- Detailed Config ----------------------------- # ----------------------------- Detailed Config -----------------------------
@ -68,7 +68,7 @@ math_eval_cfg = dict(
]), ]),
), ),
dataset_cfg=dict( dataset_cfg=dict(
type=HLEDataset, type=HLEDataset_Bio_Med,
path='cais/hle', path='cais/hle',
reader_cfg=math_reader_cfg, reader_cfg=math_reader_cfg,
), ),
@ -81,7 +81,7 @@ math_eval_cfg = dict(
hle_datasets = [ hle_datasets = [
dict( dict(
type=HLEDataset, type=HLEDataset_Bio_Med,
abbr='hle_llmjudge', abbr='hle_llmjudge',
path='cais/hle', path='cais/hle',
reader_cfg=math_reader_cfg, reader_cfg=math_reader_cfg,

View File

@ -15,3 +15,17 @@ class HLEDataset(BaseDataset):
dataset['test'] = dataset['test'].rename_column('question', 'problem') dataset['test'] = dataset['test'].rename_column('question', 'problem')
dataset['train'] = dataset['test'] dataset['train'] = dataset['test']
return dataset return dataset
@LOAD_DATASET.register_module()
class HLEDataset_Bio_Med(BaseDataset):
    """Dataset loader that keeps only image-free Biology/Medicine rows."""

    @staticmethod
    def load(path: str):
        """Load the dataset at ``path`` and narrow its ``test`` split.

        Rows whose ``image`` field is not the empty string are dropped
        first; of the remainder, only rows whose ``category`` equals
        ``'Biology/Medicine'`` are kept. The ``question`` column is then
        renamed to ``problem`` and the same filtered split is also stored
        under the ``train`` key.

        Args:
            path: Dataset identifier forwarded unchanged to ``load_dataset``.

        Returns:
            The object returned by ``load_dataset`` with its ``test`` and
            ``train`` entries replaced by the filtered split.
        """

        def _has_no_image(row):
            return row['image'] == ''

        def _is_bio_med(row):
            return row['category'] == 'Biology/Medicine'

        splits = load_dataset(path)

        # Apply the predicates one after another, in the original order.
        test_split = splits['test']
        for keep in (_has_no_image, _is_bio_med):
            test_split = test_split.filter(keep)

        splits['test'] = test_split.rename_column('question', 'problem')
        # 'train' points at the very same filtered split as 'test'.
        splits['train'] = splits['test']
        return splits