mirror of
https://github.com/open-compass/opencompass.git
synced 2025-05-30 16:03:24 +08:00
hle biomed test
This commit is contained in:
parent
e8bc8c1e8c
commit
12597edea6
@ -3,7 +3,7 @@ from opencompass.openicl.icl_retriever import ZeroRetriever
|
||||
from opencompass.openicl.icl_inferencer import GenInferencer
|
||||
from opencompass.evaluator import GenericLLMEvaluator
|
||||
from opencompass.datasets import generic_llmjudge_postprocess
|
||||
from opencompass.datasets import HLEDataset
|
||||
from opencompass.datasets import HLEDataset_Bio_Med
|
||||
|
||||
# ----------------------------- Detailed Config -----------------------------
|
||||
|
||||
@ -68,7 +68,7 @@ math_eval_cfg = dict(
|
||||
]),
|
||||
),
|
||||
dataset_cfg=dict(
|
||||
type=HLEDataset,
|
||||
type=HLEDataset_Bio_Med,
|
||||
path='cais/hle',
|
||||
reader_cfg=math_reader_cfg,
|
||||
),
|
||||
@ -81,7 +81,7 @@ math_eval_cfg = dict(
|
||||
|
||||
hle_datasets = [
|
||||
dict(
|
||||
type=HLEDataset,
|
||||
type=HLEDataset_Bio_Med,
|
||||
abbr='hle_llmjudge',
|
||||
path='cais/hle',
|
||||
reader_cfg=math_reader_cfg,
|
||||
|
@ -15,3 +15,17 @@ class HLEDataset(BaseDataset):
|
||||
dataset['test'] = dataset['test'].rename_column('question', 'problem')
|
||||
dataset['train'] = dataset['test']
|
||||
return dataset
|
||||
|
||||
|
||||
@LOAD_DATASET.register_module()
class HLEDataset_Bio_Med(BaseDataset):
    """HLE dataset restricted to image-free ``Biology/Medicine`` rows."""

    @staticmethod
    def load(path: str):
        """Load the dataset at ``path`` and narrow its ``test`` split.

        The ``test`` split is filtered in two passes: first to rows whose
        ``image`` field is an empty string, then to rows whose ``category``
        equals ``'Biology/Medicine'``. The ``question`` column is renamed to
        ``problem`` and the resulting split is also stored under ``train``.

        Args:
            path: Dataset identifier or location forwarded to
                ``load_dataset``.

        Returns:
            The loaded dataset mapping with ``test`` and ``train`` both
            pointing at the filtered, renamed split.
        """

        def _has_no_image(row):
            return row['image'] == ''

        def _is_bio_med(row):
            return row['category'] == 'Biology/Medicine'

        splits = load_dataset(path)

        subset = splits['test'].filter(_has_no_image)
        subset = subset.filter(_is_bio_med)
        subset = subset.rename_column('question', 'problem')

        splits['test'] = subset
        # ``train`` mirrors ``test``: the same split object is exposed twice.
        splits['train'] = splits['test']
        return splits
|
||||
|
Loading…
Reference in New Issue
Block a user